In [0]:
"""
We use the following lines because we are running on Google Colab.
If you are running this notebook on a local computer, you don't need this cell.
"""
from google.colab import drive
drive.mount('/content/gdrive')
import os
os.chdir('/content/gdrive/My Drive/finch/tensorflow1/semantic_parsing/tree_slu/main')
In [2]:
%tensorflow_version 1.x
!pip install tensorflow-hub
!pip install texar
Requirement already satisfied: tensorflow-hub in /usr/local/lib/python3.6/dist-packages (0.7.0)
Requirement already satisfied: protobuf>=3.4.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-hub) (3.10.0)
Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-hub) (1.12.0)
Requirement already satisfied: numpy>=1.12.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-hub) (1.17.4)
Requirement already satisfied: setuptools in /usr/local/lib/python3.6/dist-packages (from protobuf>=3.4.0->tensorflow-hub) (41.4.0)
Collecting texar
  Downloading https://files.pythonhosted.org/packages/f4/a7/c439f300fa7bc53a798e48da4896a62aa92053f93e78c160d74b6742531b/texar-0.2.3.tar.gz (260kB)
     |████████████████████████████████| 266kB 9.1MB/s 
Collecting numpy<1.17.0
  Downloading https://files.pythonhosted.org/packages/98/87/41283370f942f647422581eed16df4b653a744a3e9d5cfbb9aee0440f6eb/numpy-1.16.5-cp36-cp36m-manylinux1_x86_64.whl (17.4MB)
     |████████████████████████████████| 17.4MB 476kB/s 
Requirement already satisfied: pathlib>=1.0 in /usr/local/lib/python3.6/dist-packages (from texar) (1.0.1)
Requirement already satisfied: pyyaml in /usr/local/lib/python3.6/dist-packages (from texar) (3.13)
Requirement already satisfied: requests in /usr/local/lib/python3.6/dist-packages (from texar) (2.21.0)
Collecting funcsigs>=1.0.2
  Downloading https://files.pythonhosted.org/packages/69/cb/f5be453359271714c01b9bd06126eaf2e368f1fddfff30818754b5ac2328/funcsigs-1.0.2-py2.py3-none-any.whl
Requirement already satisfied: packaging in /usr/local/lib/python3.6/dist-packages (from texar) (19.2)
Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.6/dist-packages (from requests->texar) (2019.9.11)
Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.6/dist-packages (from requests->texar) (3.0.4)
Requirement already satisfied: idna<2.9,>=2.5 in /usr/local/lib/python3.6/dist-packages (from requests->texar) (2.8)
Requirement already satisfied: urllib3<1.25,>=1.21.1 in /usr/local/lib/python3.6/dist-packages (from requests->texar) (1.24.3)
Requirement already satisfied: pyparsing>=2.0.2 in /usr/local/lib/python3.6/dist-packages (from packaging->texar) (2.4.5)
Requirement already satisfied: six in /usr/local/lib/python3.6/dist-packages (from packaging->texar) (1.12.0)
Building wheels for collected packages: texar
  Building wheel for texar (setup.py) ... done
  Created wheel for texar: filename=texar-0.2.3-cp36-none-any.whl size=395469 sha256=72dcb299e89a8ce749a5a6e0bd527b2739205b8d6ad213b8f1f92aa96ab6fb76
  Stored in directory: /root/.cache/pip/wheels/a9/00/3d/b2c9a2c98e2102bb3fe24ebaa5bd09303fa392aab6f77d78e8
Successfully built texar
ERROR: datascience 0.10.6 has requirement folium==0.2.1, but you'll have folium 0.8.3 which is incompatible.
ERROR: albumentations 0.1.12 has requirement imgaug<0.2.7,>=0.2.5, but you'll have imgaug 0.2.9 which is incompatible.
Installing collected packages: numpy, funcsigs, texar
  Found existing installation: numpy 1.17.4
    Uninstalling numpy-1.17.4:
      Successfully uninstalled numpy-1.17.4
Successfully installed funcsigs-1.0.2 numpy-1.16.5 texar-0.2.3
In [3]:
import tensorflow as tf
import tensorflow_hub as hub
import texar.tf as tx

import numpy as np
import pprint
import logging
import time
import nltk

from texar.tf.modules import TransformerDecoder
from pathlib import Path

# Report the runtime environment; the install cell selects TensorFlow 1.x.
print("TensorFlow Version", tf.__version__)
print('GPU Enabled:', tf.test.is_gpu_available())
TensorFlow Version 1.15.0
GPU Enabled: True
In [0]:
# stream data from text files
def data_generator(f_path, params):
  """Yield one example per non-blank line of a tab-separated data file.

  Every non-blank line must contain exactly three tab-separated fields:
  the raw utterance, the tokenized utterance and the bracketed label.

  Args:
    f_path: path of the TSV file to read (decoded as UTF-8).
    params: dict providing 'tgt2idx', a token -> integer id mapping.

  Yields:
    (tokens, (target_in, target_out)) where `tokens` is the lower-cased,
    whitespace-split tokenized utterance, `target_in` is the label id
    sequence prefixed with id 1 and `target_out` is the same sequence
    suffixed with id 2.

  Raises:
    ValueError: if a non-blank line does not have exactly three fields.
  """
  tgt2idx = params['tgt2idx']
  # Label tokens missing from the vocabulary share one extra id placed
  # right after the last known id.
  oov_id = len(tgt2idx)
  with open(f_path, encoding='utf-8') as f:
    print('Reading', f_path)
    for line in f:
      # A blank (e.g. trailing) line would otherwise break the unpacking below.
      if not line.strip():
        continue
      _, text_tokenized, label = line.split('\t')
      text_tokenized = text_tokenized.lower().split()
      # Detach '[' from the intent/slot name so the bracket is its own token.
      label = label.replace('[', '[ ').lower().split()
      target = [tgt2idx.get(w, oov_id) for w in label]
      target_in = [1] + target
      target_out = target + [2]
      yield (text_tokenized, (target_in, target_out))
In [0]:
def dataset(is_training, params):
  """Build the tf.data pipeline for training or for inference.

  Args:
    is_training: True to read params['train_path'] (shuffled, batched by
      params['batch_size'], repeated 10 times); False to read
      params['test_path'] in file order with batches four times larger.
    params: dict with the paths, 'buffer_size', 'batch_size' and whatever
      `data_generator` needs.

  Returns:
    A tf.data.Dataset of padded (tokens, (target_in, target_out)) batches.
  """
  shapes = ([None], ([None], [None]))
  types = (tf.string, (tf.int32, tf.int32))
  # Token strings are padded with '<pad>', id sequences with 0.
  pad_values = ('<pad>', (0, 0))

  path_key = 'train_path' if is_training else 'test_path'
  ds = tf.data.Dataset.from_generator(
    lambda: data_generator(params[path_key], params),
    output_types=types,
    output_shapes=shapes)

  if is_training:
    ds = (ds.shuffle(params['buffer_size'])
            .padded_batch(params['batch_size'], shapes, pad_values)
            .repeat(10))
  else:
    ds = ds.padded_batch(4 * params['batch_size'], shapes, pad_values)

  return ds.prefetch(tf.data.experimental.AUTOTUNE)
In [0]:
def forward(raw_texts, labels, mode):
    """Build the encoder-decoder graph and return logits or decoded ids.

    The encoder concatenates a frozen-ELMo projection with a trainable
    embedding loaded from '../vocab/word.npy' and feeds it to a bidirectional
    fused LSTM. The decoder is a Texar TransformerDecoder whose output layer
    is the transposed embedding matrix (weights tied with the input embedding).

    Reads the module-level `params` and `config_model`.

    Args:
        raw_texts: string tensor of '<pad>'-padded tokens, one row per
            utterance (presumably [batch, time] -- confirm against `dataset`).
        labels: (dec_inputs, dec_outputs) id tensors; only used when `mode`
            is TRAIN or EVAL.
        mode: a tf.estimator.ModeKeys value.

    Returns:
        TRAIN / EVAL: the decoder logits for the teacher-forced inputs.
        PREDICT: the ids of the first beam returned by beam search
            (`sample_id[:, :, 0]`).
    """
    vocab = tf.contrib.lookup.index_table_from_file(
        params['vocab_tgt_path'], num_oov_buckets=1)
    words = vocab.lookup(raw_texts)
    # Length = number of non-zero ids; assumes '<pad>' is id 0 in the vocab
    # file -- TODO confirm.
    words_len = tf.count_nonzero(words, 1, dtype=tf.int32)
    
    is_training = (mode == tf.estimator.ModeKeys.TRAIN)
    batch_sz = tf.shape(words)[0]
    
    
    with tf.variable_scope('Embedding'):
        # Frozen contextual features, projected down to rnn_units.
        elmo = hub.Module("https://tfhub.dev/google/elmo/2", trainable=False)
        e = elmo(inputs={'tokens':raw_texts, 'sequence_len':words_len,}, signature="tokens", as_dict=True)['lstm_outputs1']
        e = tf.layers.dropout(e, params['dropout_rate'], training=is_training)
        e = tf.layers.dense(e, params['rnn_units'], params['activation'])
        
        # Trainable word embedding initialised from a pre-computed matrix.
        embedding = tf.Variable(np.load('../vocab/word.npy'),
                                dtype=tf.float32,
                                name='glove')
        x = tf.nn.embedding_lookup(embedding, words)
        x = tf.concat((x, e), -1)
        x = tf.layers.dropout(x, params['dropout_rate'], training=is_training)
    
    
    with tf.variable_scope('Encoder'):
        t = tf.transpose(x, perm=[1, 0, 2])  # Need time-major
        lstm_cell_fw = tf.contrib.rnn.LSTMBlockFusedCell(params['rnn_units'])
        lstm_cell_bw = tf.contrib.rnn.LSTMBlockFusedCell(params['rnn_units'])
        lstm_cell_bw = tf.contrib.rnn.TimeReversedFusedRNN(lstm_cell_bw)
        o_fw, s_fw = lstm_cell_fw(t, dtype=tf.float32, sequence_length=words_len)
        o_bw, s_bw = lstm_cell_bw(t, dtype=tf.float32, sequence_length=words_len)
        enc_out = tf.concat([o_fw, o_bw], axis=-1)
        enc_out = tf.transpose(enc_out, perm=[1, 0, 2])  # back to batch-major
    
    # From here on row 0 of the embedding is replaced by zeros, so id 0
    # contributes nothing on the decoder side (inputs and tied output layer).
    embedding = tf.concat([tf.zeros(shape=[1, 300]), embedding[1:, :]], axis=0)
    pos_embedder = tx.modules.SinusoidsPositionEmbedder(
        position_size = params['max_dec_len'],
        hparams = config_model.position_embedder_hparams)
    
    with tf.variable_scope('Decoder'):
        # +1 accounts for the single OOV id that follows the known vocabulary.
        decoder = TransformerDecoder(vocab_size=len(params['tgt2idx'])+1,
                                     output_layer=tf.transpose(embedding, (1, 0)),
                                     hparams=config_model.decoder)
        
        if is_training or (mode == tf.estimator.ModeKeys.EVAL):
            dec_inputs, dec_outputs = labels
            dec_seq_len = tf.count_nonzero(dec_inputs, 1, dtype=tf.int32)
            dec_inputs = tf.nn.embedding_lookup(embedding, dec_inputs)
            # Scale word embeddings by sqrt(hidden_dim) before adding positions.
            dec_inputs = (dec_inputs * config_model.hidden_dim ** 0.5) + pos_embedder(sequence_length=dec_seq_len)
            #dec_inputs = tf.layers.dropout(dec_inputs, params['dropout_rate'], training=is_training)

            # Pass the real mode: hard-coding TRAIN here kept the decoder's
            # dropout active while evaluating.
            outputs = decoder(
                memory=enc_out,
                memory_sequence_length=words_len,
                inputs=dec_inputs,
                decoding_strategy='train_greedy',
                mode=mode
            )
            
            return outputs.logits
        else:
            # Every sequence starts from id 1 (the id prepended to target_in).
            start_tokens = tf.fill([batch_sz], 1)

            def _embedding_fn(x, y):
                """Embed token ids `x` at positions `y` the same way as in training."""
                x_w_embed = tf.nn.embedding_lookup(embedding, x)
                y_p_embed = pos_embedder(y)
                return x_w_embed * config_model.hidden_dim ** 0.5 + y_p_embed

            predictions = decoder(
                memory=enc_out,
                memory_sequence_length=words_len,
                beam_width=params['beam_width'],
                length_penalty=params['length_penalty'],
                start_tokens=start_tokens,
                end_token=2,
                embedding=_embedding_fn,
                max_decoding_length=params['max_dec_len'],
                mode=tf.estimator.ModeKeys.PREDICT)
            
            # Keep only the first beam of every example.
            return predictions['sample_id'][:, :, 0]
In [0]:
def clip_grads(loss):
    """Return (gradient, variable) pairs clipped by global norm.

    Gradients of `loss` are taken with respect to every trainable variable
    and clipped to the module-level params['clip_norm']. The variable list
    is pretty-printed as a side effect.
    """
    train_vars = tf.trainable_variables()
    pprint.pprint(train_vars)
    raw_grads = tf.gradients(loss, train_vars)
    clipped = tf.clip_by_global_norm(raw_grads, params['clip_norm'])[0]
    return zip(clipped, train_vars)
In [0]:
def model_fn(features, labels, mode, params):
    """Estimator model function.

    Args:
        features: batch of token strings forwarded to `forward`.
        labels: (dec_inputs, dec_outputs) id tensors; unused in PREDICT mode.
        mode: a tf.estimator.ModeKeys value.
        params: hyper-parameter dict ('tgt2idx' and 'lr' are read here).

    Returns:
        A tf.estimator.EstimatorSpec:
          * PREDICT: predictions are the decoded ids;
          * EVAL: the loss only;
          * TRAIN: loss, train op and a hook that logs the learning rate.
    """
    logits_or_ids = forward(features, labels, mode)
    
    if mode == tf.estimator.ModeKeys.PREDICT:
        return tf.estimator.EstimatorSpec(mode, predictions=logits_or_ids)
    
    _, dec_outputs = labels
    # Label-smoothed cross entropy; positions whose target id is 0 get zero
    # weight (sign(0) == 0), so they do not contribute to the loss.
    loss_op = tf.losses.softmax_cross_entropy(onehot_labels = tf.one_hot(dec_outputs, len(params['tgt2idx'])+1),
                                              logits = logits_or_ids,
                                              weights = tf.to_float(tf.sign(dec_outputs)),
                                              label_smoothing = .1)  
      
    if mode == tf.estimator.ModeKeys.EVAL:
        # Previously this mode fell through and returned None.
        return tf.estimator.EstimatorSpec(mode=mode, loss=loss_op)
    
    if mode == tf.estimator.ModeKeys.TRAIN:
        global_step=tf.train.get_or_create_global_step()
        
        # Multiply the learning rate by 0.99 every 1000 steps.
        lr = tf.train.exponential_decay(
            params['lr'], global_step, 1000, .99)
        train_op = tf.train.AdamOptimizer(lr).apply_gradients(
            clip_grads(loss_op), global_step=global_step)
        
        hook = tf.train.LoggingTensorHook({'lr': lr}, every_n_iter=100)
        
        return tf.estimator.EstimatorSpec(
            mode=mode, loss=loss_op, train_op=train_op, training_hooks=[hook],)
In [0]:
def get_vocab(f_path):
  """Load a one-token-per-line vocabulary file.

  The file is decoded as UTF-8 regardless of the platform default encoding.

  Args:
    f_path: path of the vocabulary file.

  Returns:
    dict mapping each line (trailing whitespace removed) to its 0-based
    line number; if a token occurs more than once the last line wins.
  """
  with open(f_path, encoding='utf-8') as f:
    return {line.rstrip(): i for i, line in enumerate(f)}
In [0]:
# Hyper-parameters and file locations shared by every cell below.
params = {
    'model_dir': '../model/lstm_transformer',  # Estimator checkpoint directory
    'log_path': '../log/lstm_transformer.txt',  # file receiving the 'tensorflow' logger output
    'train_path': '../data/train.tsv',
    'test_path': '../data/test.tsv',
    'vocab_src_path': '../vocab/source.txt',  # not referenced by the visible cells
    'vocab_tgt_path': '../vocab/target.txt',  # used for the input lookup table and for tgt2idx
    'model_path': '../model/',  # not referenced by the visible cells
    'dropout_rate': 0.2,
    'rnn_units': 300,  # LSTM size; also the width of the ELMo projection
    'beam_width': 5,
    'activation': tf.nn.relu,  # activation of the ELMo projection layer
    'lr': 4e-4,  # initial learning rate of the exponential decay
    'clip_norm': 5.,  # global-norm threshold for gradient clipping
    'max_dec_len': 80,  # maximum decoding length and positional-embedding size
    'length_penalty': .6,  # beam-search length penalty
    'buffer_size': 31279,  # shuffle buffer; presumably the number of training examples -- confirm
    'batch_size': 32,  # training batch size; inference uses 4x this value
    'num_patience': 5,  # consecutive accuracy drops tolerated before early stopping
}


class config_model:
    """Hyper-parameters for the Texar position embedder and Transformer decoder."""

    # Must equal the word-embedding width: the decoder's output layer is the
    # transposed embedding matrix built in `forward`.
    hidden_dim = 300

    position_embedder_hparams = {
        'dim': hidden_dim
    }

    decoder = {
        'dim': hidden_dim,
        'num_blocks': 2,
        # 'num_units' is not set here; the logged variable shapes show
        # 300 -> 512 query/key/value projections.
        'multihead_attention': {
            'num_heads': 8,
            'output_dim': hidden_dim,
            'use_bias': True,
        },
        'initializer': {
            'type': 'variance_scaling_initializer',
            'kwargs': {
                'scale': 1.0,
                'mode': 'fan_avg',
                'distribution': 'uniform',
            },
        },
        'poswise_feedforward': tx.modules.default_transformer_poswise_net_hparams(
            output_dim=hidden_dim),
        'output_layer_bias': True,
    }
In [0]:
# Token -> id mapping read from the target vocabulary file, plus its inverse
# (id -> token) used to turn predicted ids back into text.
params['tgt2idx'] = get_vocab(params['vocab_tgt_path'])
params['idx2tgt'] = {idx: tgt for tgt, idx in params['tgt2idx'].items()}
In [0]:
def is_descending(history: list, patience: int = None) -> bool:
  """Tell whether the most recent scores are strictly decreasing.

  Args:
    history: chronological list of scores.
    patience: number of consecutive drops to look for; only the last
      `patience + 1` entries are inspected. Defaults to the module-level
      params['num_patience'].

  Returns:
    True when every inspected score is strictly lower than the one before
    it (also True when fewer than two scores are inspected), else False.
  """
  if patience is None:
    patience = params['num_patience']
  window = history[-(patience + 1):]
  return all(prev > curr for prev, curr in zip(window, window[1:]))
In [0]:
def minimal_test(estimator):
  """Parse one fixed utterance and print the result as a quick sanity check.

  Runs `estimator.predict` on a single hard-coded sentence, maps the
  predicted ids back to tokens with the module-level params['idx2tgt'],
  prints the flat parse and, when it forms a valid bracketing, an nltk
  tree rendering of it.

  Args:
    estimator: the tf.estimator.Estimator to query.
  """
  test_str = [['what', 'times', 'are', 'the', 'nutcracker', 'show', 'playing', 'near', 'me']]
  predicted = list(estimator.predict(tf.estimator.inputs.numpy_input_fn(
    x = np.array(test_str), shuffle = False)))
  print('-'*12)
  print('minimal test')
  print('utterance:', ' '.join(test_str[0]))
  # The fallback must be a string: an id missing from idx2tgt (the OOV id)
  # would otherwise make str.join raise TypeError.
  predicted = ' '.join(params['idx2tgt'].get(idx, '<unk>') for idx in predicted[0])
  predicted = predicted.replace('<end>', '').replace('<pad>', '').strip()
  print('parsed:', predicted)
  print()
  try:
    nltk.tree.Tree.fromstring(predicted.replace('[ ', '(').replace(' ]', ')')).pretty_print()
  except Exception as err:
    # Rendering is best-effort (early predictions are often not well-formed),
    # but say why it was skipped instead of failing silently.
    print('(could not render parse tree: {})'.format(err))
  print('-'*12)
In [0]:
# Create directory if not exist
# (pathlib only: `os` is imported solely in the optional Colab cell)
Path(params['log_path']).parent.mkdir(exist_ok=True, parents=True)
Path(params['model_dir']).mkdir(exist_ok=True, parents=True)

# Logging: send TensorFlow's log records to the log file as well
logger = logging.getLogger('tensorflow')
logger.propagate = False
logger.setLevel(logging.INFO)
fh = logging.FileHandler(params['log_path'])
logger.addHandler(fh)

# Create an estimator
# The training dataset repeats 10 times, so one train() call covers ten
# passes; a checkpoint is saved once per such call.
eval_steps = 10 * (params['buffer_size']//params['batch_size'] + 1)
estimator = tf.estimator.Estimator(
  model_fn=model_fn,
  model_dir=params['model_dir'],
  config=tf.estimator.RunConfig(save_checkpoints_steps=eval_steps),
  params=params)

best_acc = .0
history_acc = []
# Eager mode lets the test dataset be iterated directly in Python below.
tf.enable_eager_execution()

# Gold labels do not change between evaluations, so read them once.
label_batches = [label for _, (_, label) in dataset(is_training=False, params=params)]
# Index of the first <end> id (2) in every gold sequence.
seq_lens = [j for batch in label_batches
            for j in tf.argmax(tf.cast(tf.equal(batch, 2), tf.int32), axis=1).numpy()]
labels = [j for batch in label_batches for j in batch.numpy()]

while True:
  estimator.train(input_fn=lambda: dataset(is_training=True, params=params))

  minimal_test(estimator)

  # Evaluation
  preds = list(estimator.predict(input_fn=lambda: dataset(is_training=False, params=params)))

  assert len(preds) == len(labels)

  # Exact match up to and including the gold <end>. array_equal also returns
  # False when the prediction is shorter than the gold sequence, where an
  # element-wise == on differently sized slices is not well defined.
  res = [np.array_equal(p[:seq_len+1], l[:seq_len+1]) for p, l, seq_len in zip(preds, labels, seq_lens)]
  acc = np.asarray(res).mean()
  logger.info("Evaluation: Testing (Exact Match) Accuracy: {:.3f}".format(acc))
  history_acc.append(acc)

  if acc > best_acc:
    best_acc = acc
  logger.info("Best (Exact Match) Accuracy: {:.3f}".format(best_acc))

  # Stop once accuracy has dropped num_patience evaluations in a row.
  if len(history_acc) > params['num_patience'] and is_descending(history_acc):
    logger.info("Testing (Exact Match) Accuracy not improved over {} epochs, Early Stop".format(params['num_patience']))
    break
INFO:tensorflow:Using config: {'_model_dir': '../model/lstm_transformer', '_tf_random_seed': None, '_save_summary_steps': 100, '_save_checkpoints_steps': 9780, '_save_checkpoints_secs': None, '_session_config': allow_soft_placement: true
graph_options {
  rewrite_options {
    meta_optimizer_iterations: ONE
  }
}
, '_keep_checkpoint_max': 5, '_keep_checkpoint_every_n_hours': 10000, '_log_step_count_steps': 100, '_train_distribute': None, '_device_fn': None, '_protocol': None, '_eval_distribute': None, '_experimental_distribute': None, '_experimental_max_worker_delay_secs': None, '_session_creation_timeout_secs': 7200, '_service': None, '_cluster_spec': <tensorflow.python.training.server_lib.ClusterSpec object at 0x7fb3bb75b710>, '_task_type': 'worker', '_task_id': 0, '_global_id_in_cluster': 0, '_master': '', '_evaluation_master': '', '_is_chief': True, '_num_ps_replicas': 0, '_num_worker_replicas': 1}
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/training/training_util.py:236: Variable.initialized_value (from tensorflow.python.ops.variables) is deprecated and will be removed in a future version.
Instructions for updating:
Use Variable.read_value. Variables in 2.X are initialized automatically both in eager and graph (inside tf.defun) contexts.
INFO:tensorflow:Calling model_fn.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/util/deprecation.py:507: calling count_nonzero (from tensorflow.python.ops.math_ops) with axis is deprecated and will be removed in a future version.
Instructions for updating:
reduction_indices is deprecated, use axis instead
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
WARNING:tensorflow:From <ipython-input-6-34bae373cd3f>:14: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.
Instructions for updating:
Use keras.layers.dropout instead.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/layers/core.py:271: Layer.apply (from tensorflow.python.keras.engine.base_layer) is deprecated and will be removed in a future version.
Instructions for updating:
Please use `layer.__call__` method instead.
WARNING:tensorflow:From <ipython-input-6-34bae373cd3f>:15: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.
Instructions for updating:
Use keras.layers.Dense instead.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/contrib/rnn/python/ops/lstm_ops.py:597: Layer.add_variable (from tensorflow.python.keras.engine.base_layer) is deprecated and will be removed in a future version.
Instructions for updating:
Please use `layer.add_weight` method instead.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/module_base.py:72: The name tf.make_template is deprecated. Please use tf.compat.v1.make_template instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/modules/embedders/position_embedders.py:345: The name tf.mod is deprecated. Please use tf.math.mod instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/modules/decoders/transformer_decoders.py:103: The name tf.get_variable_scope is deprecated. Please use tf.compat.v1.get_variable_scope instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/modules/decoders/rnn_decoder_base.py:57: The name tf.get_variable is deprecated. Please use tf.compat.v1.get_variable instead.

WARNING:tensorflow:From /usr/lib/python3.6/pydoc.py:1595: The name tf.layers.Dense is deprecated. Please use tf.compat.v1.layers.Dense instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/core/layers.py:600: The name tf.layers.Layer is deprecated. Please use tf.compat.v1.layers.Layer instead.

WARNING:tensorflow:From /usr/lib/python3.6/pydoc.py:1595: The name tf.layers.Dropout is deprecated. Please use tf.compat.v1.layers.Dropout instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/utils/transformer_attentions.py:105: The name tf.matrix_band_part is deprecated. Please use tf.linalg.band_part instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/modules/decoders/transformer_decoders.py:612: The name tf.AUTO_REUSE is deprecated. Please use tf.compat.v1.AUTO_REUSE instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/module_base.py:129: The name tf.get_collection is deprecated. Please use tf.compat.v1.get_collection instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/module_base.py:130: The name tf.GraphKeys is deprecated. Please use tf.compat.v1.GraphKeys instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/context.py:52: The name tf.get_collection_ref is deprecated. Please use tf.compat.v1.get_collection_ref instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/context.py:55: The name tf.placeholder_with_default is deprecated. Please use tf.compat.v1.placeholder_with_default instead.

WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/texar/tf/modules/networks/network_base.py:123: The name tf.layers.BatchNormalization is deprecated. Please use tf.compat.v1.layers.BatchNormalization instead.

WARNING:tensorflow:From <ipython-input-8-46a022234050>:10: to_float (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.
Instructions for updating:
Use `tf.cast` instead.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/ops/losses/losses_impl.py:121: where (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.
Instructions for updating:
Use tf.where in 2.0, which has the same broadcast rule as np.where
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 0 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 59.033955, step = 0
INFO:tensorflow:lr = 0.0004
INFO:tensorflow:global_step/sec: 9.45219
INFO:tensorflow:loss = 5.0954924, step = 100 (10.586 sec)
INFO:tensorflow:lr = 0.00039959815 (10.582 sec)
INFO:tensorflow:global_step/sec: 11.9891
INFO:tensorflow:loss = 4.4737344, step = 200 (8.342 sec)
INFO:tensorflow:lr = 0.00039919675 (8.342 sec)
INFO:tensorflow:global_step/sec: 12.0835
INFO:tensorflow:loss = 4.20246, step = 300 (8.271 sec)
INFO:tensorflow:lr = 0.00039879576 (8.272 sec)
INFO:tensorflow:global_step/sec: 12.1546
INFO:tensorflow:loss = 4.0485344, step = 400 (8.226 sec)
INFO:tensorflow:lr = 0.00039839515 (8.226 sec)
INFO:tensorflow:global_step/sec: 12.4508
INFO:tensorflow:loss = 3.9781508, step = 500 (8.034 sec)
INFO:tensorflow:lr = 0.00039799497 (8.033 sec)
INFO:tensorflow:global_step/sec: 12.4297
INFO:tensorflow:loss = 3.8139787, step = 600 (8.042 sec)
INFO:tensorflow:lr = 0.00039759517 (8.042 sec)
INFO:tensorflow:global_step/sec: 12.1124
INFO:tensorflow:loss = 3.5685873, step = 700 (8.262 sec)
INFO:tensorflow:lr = 0.00039719575 (8.262 sec)
INFO:tensorflow:global_step/sec: 12.1605
INFO:tensorflow:loss = 3.525229, step = 800 (8.222 sec)
INFO:tensorflow:lr = 0.0003967968 (8.221 sec)
INFO:tensorflow:global_step/sec: 12.0023
INFO:tensorflow:loss = 3.318803, step = 900 (8.334 sec)
INFO:tensorflow:lr = 0.0003963982 (8.334 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.02963
INFO:tensorflow:loss = 3.2519212, step = 1000 (12.453 sec)
INFO:tensorflow:lr = 0.00039599996 (12.454 sec)
INFO:tensorflow:global_step/sec: 12.1495
INFO:tensorflow:loss = 3.045715, step = 1100 (8.232 sec)
INFO:tensorflow:lr = 0.0003956022 (8.231 sec)
INFO:tensorflow:global_step/sec: 12.0573
INFO:tensorflow:loss = 3.4412713, step = 1200 (8.294 sec)
INFO:tensorflow:lr = 0.00039520478 (8.294 sec)
INFO:tensorflow:global_step/sec: 12.0834
INFO:tensorflow:loss = 2.9590592, step = 1300 (8.273 sec)
INFO:tensorflow:lr = 0.0003948078 (8.275 sec)
INFO:tensorflow:global_step/sec: 12.2286
INFO:tensorflow:loss = 2.948428, step = 1400 (8.179 sec)
INFO:tensorflow:lr = 0.0003944112 (8.178 sec)
INFO:tensorflow:global_step/sec: 12.4073
INFO:tensorflow:loss = 2.8570395, step = 1500 (8.061 sec)
INFO:tensorflow:lr = 0.00039401502 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.1437
INFO:tensorflow:loss = 2.8721683, step = 1600 (8.229 sec)
INFO:tensorflow:lr = 0.0003936192 (8.230 sec)
INFO:tensorflow:global_step/sec: 12.4888
INFO:tensorflow:loss = 2.6866806, step = 1700 (8.007 sec)
INFO:tensorflow:lr = 0.00039322383 (8.006 sec)
INFO:tensorflow:global_step/sec: 12.2946
INFO:tensorflow:loss = 2.5551322, step = 1800 (8.134 sec)
INFO:tensorflow:lr = 0.0003928288 (8.134 sec)
INFO:tensorflow:global_step/sec: 12.5544
INFO:tensorflow:loss = 2.6697116, step = 1900 (7.965 sec)
INFO:tensorflow:lr = 0.0003924342 (7.966 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.853
INFO:tensorflow:loss = 2.5178728, step = 2000 (12.740 sec)
INFO:tensorflow:lr = 0.00039203998 (12.739 sec)
INFO:tensorflow:global_step/sec: 12.1408
INFO:tensorflow:loss = 2.506233, step = 2100 (8.235 sec)
INFO:tensorflow:lr = 0.00039164617 (8.235 sec)
INFO:tensorflow:global_step/sec: 12.46
INFO:tensorflow:loss = 2.2534523, step = 2200 (8.026 sec)
INFO:tensorflow:lr = 0.00039125275 (8.027 sec)
INFO:tensorflow:global_step/sec: 12.586
INFO:tensorflow:loss = 2.0285623, step = 2300 (7.941 sec)
INFO:tensorflow:lr = 0.00039085973 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.5412
INFO:tensorflow:loss = 2.0797236, step = 2400 (7.973 sec)
INFO:tensorflow:lr = 0.00039046712 (7.973 sec)
INFO:tensorflow:global_step/sec: 12.8519
INFO:tensorflow:loss = 2.145553, step = 2500 (7.787 sec)
INFO:tensorflow:lr = 0.00039007486 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.394
INFO:tensorflow:loss = 1.9565487, step = 2600 (8.063 sec)
INFO:tensorflow:lr = 0.00038968303 (8.064 sec)
INFO:tensorflow:global_step/sec: 12.363
INFO:tensorflow:loss = 2.0215652, step = 2700 (8.096 sec)
INFO:tensorflow:lr = 0.00038929158 (8.095 sec)
INFO:tensorflow:global_step/sec: 12.4914
INFO:tensorflow:loss = 2.0743313, step = 2800 (7.998 sec)
INFO:tensorflow:lr = 0.00038890052 (8.002 sec)
INFO:tensorflow:global_step/sec: 12.6555
INFO:tensorflow:loss = 1.9481674, step = 2900 (7.907 sec)
INFO:tensorflow:lr = 0.00038850983 (7.903 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.19896
INFO:tensorflow:loss = 1.8079375, step = 3000 (12.195 sec)
INFO:tensorflow:lr = 0.0003881196 (12.195 sec)
INFO:tensorflow:global_step/sec: 12.647
INFO:tensorflow:loss = 1.858728, step = 3100 (7.910 sec)
INFO:tensorflow:lr = 0.0003877297 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.7231
INFO:tensorflow:loss = 1.7418987, step = 3200 (7.853 sec)
INFO:tensorflow:lr = 0.00038734023 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.633
INFO:tensorflow:loss = 1.8075138, step = 3300 (7.915 sec)
INFO:tensorflow:lr = 0.00038695114 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.6876
INFO:tensorflow:loss = 1.9535941, step = 3400 (7.886 sec)
INFO:tensorflow:lr = 0.00038656246 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.8031
INFO:tensorflow:loss = 1.7075312, step = 3500 (7.807 sec)
INFO:tensorflow:lr = 0.00038617416 (7.808 sec)
INFO:tensorflow:global_step/sec: 12.5066
INFO:tensorflow:loss = 1.8058743, step = 3600 (7.997 sec)
INFO:tensorflow:lr = 0.0003857862 (7.996 sec)
INFO:tensorflow:global_step/sec: 12.8845
INFO:tensorflow:loss = 1.6459893, step = 3700 (7.764 sec)
INFO:tensorflow:lr = 0.00038539866 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.6028
INFO:tensorflow:loss = 1.8697182, step = 3800 (7.930 sec)
INFO:tensorflow:lr = 0.00038501152 (7.930 sec)
INFO:tensorflow:global_step/sec: 12.6564
INFO:tensorflow:loss = 1.7144407, step = 3900 (7.904 sec)
INFO:tensorflow:lr = 0.00038462476 (7.905 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.39316
INFO:tensorflow:loss = 1.6077055, step = 4000 (11.917 sec)
INFO:tensorflow:lr = 0.0003842384 (11.915 sec)
INFO:tensorflow:global_step/sec: 12.8114
INFO:tensorflow:loss = 1.6767513, step = 4100 (7.804 sec)
INFO:tensorflow:lr = 0.00038385243 (7.808 sec)
INFO:tensorflow:global_step/sec: 12.63
INFO:tensorflow:loss = 1.6651752, step = 4200 (7.919 sec)
INFO:tensorflow:lr = 0.00038346683 (7.915 sec)
INFO:tensorflow:global_step/sec: 12.8231
INFO:tensorflow:loss = 1.574295, step = 4300 (7.798 sec)
INFO:tensorflow:lr = 0.00038308164 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.4846
INFO:tensorflow:loss = 1.6911457, step = 4400 (8.006 sec)
INFO:tensorflow:lr = 0.00038269683 (8.009 sec)
INFO:tensorflow:global_step/sec: 12.6322
INFO:tensorflow:loss = 1.6363447, step = 4500 (7.920 sec)
INFO:tensorflow:lr = 0.0003823124 (7.917 sec)
INFO:tensorflow:global_step/sec: 12.8063
INFO:tensorflow:loss = 1.7158389, step = 4600 (7.804 sec)
INFO:tensorflow:lr = 0.00038192834 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.6763
INFO:tensorflow:loss = 1.6156652, step = 4700 (7.889 sec)
INFO:tensorflow:lr = 0.00038154467 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.1828
INFO:tensorflow:loss = 1.4845752, step = 4800 (8.208 sec)
INFO:tensorflow:lr = 0.0003811614 (8.207 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.4912
INFO:tensorflow:loss = 1.6173213, step = 4900 (11.777 sec)
INFO:tensorflow:lr = 0.0003807785 (11.777 sec)
INFO:tensorflow:global_step/sec: 12.9355
INFO:tensorflow:loss = 1.5071679, step = 5000 (7.735 sec)
INFO:tensorflow:lr = 0.00038039603 (7.736 sec)
INFO:tensorflow:global_step/sec: 12.8336
INFO:tensorflow:loss = 1.5181412, step = 5100 (7.788 sec)
INFO:tensorflow:lr = 0.0003800139 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.678
INFO:tensorflow:loss = 1.6296129, step = 5200 (7.890 sec)
INFO:tensorflow:lr = 0.00037963217 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.4484
INFO:tensorflow:loss = 1.5062387, step = 5300 (8.033 sec)
INFO:tensorflow:lr = 0.00037925082 (8.031 sec)
INFO:tensorflow:global_step/sec: 12.8709
INFO:tensorflow:loss = 1.4886248, step = 5400 (7.771 sec)
INFO:tensorflow:lr = 0.00037886985 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.6909
INFO:tensorflow:loss = 1.4882165, step = 5500 (7.874 sec)
INFO:tensorflow:lr = 0.00037848923 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.6324
INFO:tensorflow:loss = 1.48171, step = 5600 (7.917 sec)
INFO:tensorflow:lr = 0.00037810905 (7.913 sec)
INFO:tensorflow:global_step/sec: 12.8959
INFO:tensorflow:loss = 1.5500232, step = 5700 (7.757 sec)
INFO:tensorflow:lr = 0.00037772924 (7.757 sec)
INFO:tensorflow:global_step/sec: 12.8081
INFO:tensorflow:loss = 1.4949408, step = 5800 (7.809 sec)
INFO:tensorflow:lr = 0.0003773498 (7.808 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.87373
INFO:tensorflow:loss = 1.5293541, step = 5900 (11.270 sec)
INFO:tensorflow:lr = 0.00037697077 (11.272 sec)
INFO:tensorflow:global_step/sec: 12.9509
INFO:tensorflow:loss = 1.5244159, step = 6000 (7.716 sec)
INFO:tensorflow:lr = 0.00037659207 (7.717 sec)
INFO:tensorflow:global_step/sec: 12.8297
INFO:tensorflow:loss = 1.4912233, step = 6100 (7.795 sec)
INFO:tensorflow:lr = 0.00037621378 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.8172
INFO:tensorflow:loss = 1.4585661, step = 6200 (7.803 sec)
INFO:tensorflow:lr = 0.00037583587 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.8078
INFO:tensorflow:loss = 1.4709327, step = 6300 (7.807 sec)
INFO:tensorflow:lr = 0.00037545833 (7.810 sec)
INFO:tensorflow:global_step/sec: 12.768
INFO:tensorflow:loss = 1.5252771, step = 6400 (7.836 sec)
INFO:tensorflow:lr = 0.00037508114 (7.834 sec)
INFO:tensorflow:global_step/sec: 12.4801
INFO:tensorflow:loss = 1.4626974, step = 6500 (8.016 sec)
INFO:tensorflow:lr = 0.00037470434 (8.015 sec)
INFO:tensorflow:global_step/sec: 12.4797
INFO:tensorflow:loss = 1.4680932, step = 6600 (8.011 sec)
INFO:tensorflow:lr = 0.00037432797 (8.011 sec)
INFO:tensorflow:global_step/sec: 12.6182
INFO:tensorflow:loss = 1.4867874, step = 6700 (7.920 sec)
INFO:tensorflow:lr = 0.00037395195 (7.921 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.7869
INFO:tensorflow:loss = 1.5120995, step = 6800 (8.494 sec)
INFO:tensorflow:lr = 0.0003735763 (8.497 sec)
INFO:tensorflow:global_step/sec: 10.8646
INFO:tensorflow:loss = 1.5093869, step = 6900 (9.195 sec)
INFO:tensorflow:lr = 0.00037320104 (9.192 sec)
INFO:tensorflow:global_step/sec: 12.6021
INFO:tensorflow:loss = 1.4627079, step = 7000 (7.934 sec)
INFO:tensorflow:lr = 0.00037282615 (7.938 sec)
INFO:tensorflow:global_step/sec: 12.4589
INFO:tensorflow:loss = 1.4051437, step = 7100 (8.026 sec)
INFO:tensorflow:lr = 0.00037245164 (8.022 sec)
INFO:tensorflow:global_step/sec: 12.9606
INFO:tensorflow:loss = 1.4104779, step = 7200 (7.716 sec)
INFO:tensorflow:lr = 0.0003720775 (7.716 sec)
INFO:tensorflow:global_step/sec: 12.5317
INFO:tensorflow:loss = 1.4525088, step = 7300 (7.979 sec)
INFO:tensorflow:lr = 0.00037170373 (7.980 sec)
INFO:tensorflow:global_step/sec: 12.8884
INFO:tensorflow:loss = 1.4862131, step = 7400 (7.763 sec)
INFO:tensorflow:lr = 0.00037133033 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.3808
INFO:tensorflow:loss = 1.4874706, step = 7500 (8.079 sec)
INFO:tensorflow:lr = 0.0003709573 (8.078 sec)
INFO:tensorflow:global_step/sec: 12.6027
INFO:tensorflow:loss = 1.4101737, step = 7600 (7.931 sec)
INFO:tensorflow:lr = 0.0003705847 (7.935 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5763
INFO:tensorflow:loss = 1.4103632, step = 7700 (7.951 sec)
INFO:tensorflow:lr = 0.00037021242 (7.948 sec)
INFO:tensorflow:global_step/sec: 11.0486
INFO:tensorflow:loss = 1.4301885, step = 7800 (9.050 sec)
INFO:tensorflow:lr = 0.00036984053 (9.049 sec)
INFO:tensorflow:global_step/sec: 12.9262
INFO:tensorflow:loss = 1.4219362, step = 7900 (7.738 sec)
INFO:tensorflow:lr = 0.00036946902 (7.743 sec)
INFO:tensorflow:global_step/sec: 12.6925
INFO:tensorflow:loss = 1.4855167, step = 8000 (7.877 sec)
INFO:tensorflow:lr = 0.0003690979 (7.872 sec)
INFO:tensorflow:global_step/sec: 12.5745
INFO:tensorflow:loss = 1.3784947, step = 8100 (7.956 sec)
INFO:tensorflow:lr = 0.00036872714 (7.956 sec)
INFO:tensorflow:global_step/sec: 12.545
INFO:tensorflow:loss = 1.4119531, step = 8200 (7.970 sec)
INFO:tensorflow:lr = 0.0003683567 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.5777
INFO:tensorflow:loss = 1.4218488, step = 8300 (7.949 sec)
INFO:tensorflow:lr = 0.00036798668 (7.950 sec)
INFO:tensorflow:global_step/sec: 12.7638
INFO:tensorflow:loss = 1.4013296, step = 8400 (7.835 sec)
INFO:tensorflow:lr = 0.00036761703 (7.833 sec)
INFO:tensorflow:global_step/sec: 12.6604
INFO:tensorflow:loss = 1.3762985, step = 8500 (7.900 sec)
INFO:tensorflow:lr = 0.00036724776 (7.900 sec)
INFO:tensorflow:global_step/sec: 13.0189
INFO:tensorflow:loss = 1.4109349, step = 8600 (7.682 sec)
INFO:tensorflow:lr = 0.00036687887 (7.683 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.6167
INFO:tensorflow:loss = 1.4246565, step = 8700 (8.613 sec)
INFO:tensorflow:lr = 0.0003665103 (8.619 sec)
INFO:tensorflow:global_step/sec: 11.3619
INFO:tensorflow:loss = 1.3846593, step = 8800 (8.798 sec)
INFO:tensorflow:lr = 0.00036614214 (8.791 sec)
INFO:tensorflow:global_step/sec: 12.544
INFO:tensorflow:loss = 1.4037898, step = 8900 (7.972 sec)
INFO:tensorflow:lr = 0.00036577435 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.6411
INFO:tensorflow:loss = 1.4317508, step = 9000 (7.911 sec)
INFO:tensorflow:lr = 0.00036540694 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.762
INFO:tensorflow:loss = 1.4514229, step = 9100 (7.842 sec)
INFO:tensorflow:lr = 0.00036503986 (7.842 sec)
INFO:tensorflow:global_step/sec: 12.8531
INFO:tensorflow:loss = 1.3912779, step = 9200 (7.773 sec)
INFO:tensorflow:lr = 0.00036467315 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.6416
INFO:tensorflow:loss = 1.4078438, step = 9300 (7.910 sec)
INFO:tensorflow:lr = 0.00036430682 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.7305
INFO:tensorflow:loss = 1.3546025, step = 9400 (7.854 sec)
INFO:tensorflow:lr = 0.00036394087 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.6416
INFO:tensorflow:loss = 1.376714, step = 9500 (7.913 sec)
INFO:tensorflow:lr = 0.0003635753 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.5347
INFO:tensorflow:loss = 1.3942187, step = 9600 (7.973 sec)
INFO:tensorflow:lr = 0.00036321007 (7.973 sec)
INFO:tensorflow:global_step/sec: 13.0655
INFO:tensorflow:loss = 1.3802559, step = 9700 (7.654 sec)
INFO:tensorflow:lr = 0.00036284523 (7.654 sec)
INFO:tensorflow:Saving checkpoints for 9780 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.3757502.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_estimator/python/estimator/inputs/queues/feeding_queue_runner.py:62: QueueRunner.__init__ (from tensorflow.python.training.queue_runner_impl) is deprecated and will be removed in a future version.
Instructions for updating:
To construct input pipelines, use the `tf.data` module.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_estimator/python/estimator/inputs/queues/feeding_functions.py:500: add_queue_runner (from tensorflow.python.training.queue_runner_impl) is deprecated and will be removed in a future version.
Instructions for updating:
To construct input pipelines, use the `tf.data` module.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-9780
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/training/monitored_session.py:882: start_queue_runners (from tensorflow.python.training.queue_runner_impl) is deprecated and will be removed in a future version.
Instructions for updating:
To construct input pipelines, use the `tf.data` module.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-9780
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.614
INFO:tensorflow:Best (Exact Match) Accuracy: 0.614
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-9780
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/training/saver.py:1069: get_checkpoint_mtimes (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.
Instructions for updating:
Use standard file utilities to get mtimes.
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 9780 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.3950752, step = 9780
INFO:tensorflow:lr = 0.00036255358
INFO:tensorflow:global_step/sec: 9.89531
INFO:tensorflow:loss = 1.38784, step = 9880 (10.114 sec)
INFO:tensorflow:lr = 0.0003621894 (10.114 sec)
INFO:tensorflow:global_step/sec: 12.511
INFO:tensorflow:loss = 1.3594651, step = 9980 (7.991 sec)
INFO:tensorflow:lr = 0.00036182557 (7.986 sec)
INFO:tensorflow:global_step/sec: 12.6818
INFO:tensorflow:loss = 1.3496534, step = 10080 (7.885 sec)
INFO:tensorflow:lr = 0.0003614621 (7.885 sec)
INFO:tensorflow:global_step/sec: 12.8195
INFO:tensorflow:loss = 1.3859842, step = 10180 (7.800 sec)
INFO:tensorflow:lr = 0.00036109902 (7.801 sec)
INFO:tensorflow:global_step/sec: 12.7904
INFO:tensorflow:loss = 1.4064968, step = 10280 (7.821 sec)
INFO:tensorflow:lr = 0.0003607363 (7.820 sec)
INFO:tensorflow:global_step/sec: 12.9878
INFO:tensorflow:loss = 1.3514677, step = 10380 (7.697 sec)
INFO:tensorflow:lr = 0.00036037393 (7.697 sec)
INFO:tensorflow:global_step/sec: 12.7001
INFO:tensorflow:loss = 1.3718523, step = 10480 (7.877 sec)
INFO:tensorflow:lr = 0.0003600119 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.4932
INFO:tensorflow:loss = 1.3550223, step = 10580 (8.002 sec)
INFO:tensorflow:lr = 0.00035965024 (8.002 sec)
INFO:tensorflow:global_step/sec: 12.7582
INFO:tensorflow:loss = 1.3919998, step = 10680 (7.836 sec)
INFO:tensorflow:lr = 0.00035928897 (7.834 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.20005
INFO:tensorflow:loss = 1.3931295, step = 10780 (12.198 sec)
INFO:tensorflow:lr = 0.00035892805 (12.199 sec)
INFO:tensorflow:global_step/sec: 12.7685
INFO:tensorflow:loss = 1.3510262, step = 10880 (7.829 sec)
INFO:tensorflow:lr = 0.00035856751 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.7663
INFO:tensorflow:loss = 1.398536, step = 10980 (7.836 sec)
INFO:tensorflow:lr = 0.00035820733 (7.836 sec)
INFO:tensorflow:global_step/sec: 12.6607
INFO:tensorflow:loss = 1.3688757, step = 11080 (7.898 sec)
INFO:tensorflow:lr = 0.0003578475 (7.898 sec)
INFO:tensorflow:global_step/sec: 12.846
INFO:tensorflow:loss = 1.3669326, step = 11180 (7.786 sec)
INFO:tensorflow:lr = 0.00035748802 (7.785 sec)
INFO:tensorflow:global_step/sec: 13.0049
INFO:tensorflow:loss = 1.3798718, step = 11280 (7.688 sec)
INFO:tensorflow:lr = 0.0003571289 (7.689 sec)
INFO:tensorflow:global_step/sec: 12.5146
INFO:tensorflow:loss = 1.361347, step = 11380 (7.987 sec)
INFO:tensorflow:lr = 0.0003567702 (7.988 sec)
INFO:tensorflow:global_step/sec: 12.5729
INFO:tensorflow:loss = 1.353298, step = 11480 (7.958 sec)
INFO:tensorflow:lr = 0.0003564118 (7.957 sec)
INFO:tensorflow:global_step/sec: 12.7091
INFO:tensorflow:loss = 1.3753021, step = 11580 (7.863 sec)
INFO:tensorflow:lr = 0.00035605376 (7.864 sec)
INFO:tensorflow:global_step/sec: 12.7804
INFO:tensorflow:loss = 1.3804079, step = 11680 (7.830 sec)
INFO:tensorflow:lr = 0.0003556961 (7.829 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.14235
INFO:tensorflow:loss = 1.3768957, step = 11780 (12.278 sec)
INFO:tensorflow:lr = 0.00035533877 (12.278 sec)
INFO:tensorflow:global_step/sec: 12.6599
INFO:tensorflow:loss = 1.3538108, step = 11880 (7.902 sec)
INFO:tensorflow:lr = 0.0003549818 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.5448
INFO:tensorflow:loss = 1.3600917, step = 11980 (7.973 sec)
INFO:tensorflow:lr = 0.00035462523 (7.975 sec)
INFO:tensorflow:global_step/sec: 12.8167
INFO:tensorflow:loss = 1.3522173, step = 12080 (7.801 sec)
INFO:tensorflow:lr = 0.00035426902 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.7571
INFO:tensorflow:loss = 1.3719348, step = 12180 (7.838 sec)
INFO:tensorflow:lr = 0.00035391314 (7.832 sec)
INFO:tensorflow:global_step/sec: 12.9242
INFO:tensorflow:loss = 1.3397022, step = 12280 (7.734 sec)
INFO:tensorflow:lr = 0.00035355764 (7.735 sec)
INFO:tensorflow:global_step/sec: 12.7453
INFO:tensorflow:loss = 1.3814683, step = 12380 (7.848 sec)
INFO:tensorflow:lr = 0.0003532025 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.3341
INFO:tensorflow:loss = 1.3348244, step = 12480 (8.105 sec)
INFO:tensorflow:lr = 0.00035284765 (8.105 sec)
INFO:tensorflow:global_step/sec: 12.9432
INFO:tensorflow:loss = 1.3358412, step = 12580 (7.731 sec)
INFO:tensorflow:lr = 0.0003524932 (7.731 sec)
INFO:tensorflow:global_step/sec: 12.7795
INFO:tensorflow:loss = 1.3471819, step = 12680 (7.821 sec)
INFO:tensorflow:lr = 0.00035213912 (7.822 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.29116
INFO:tensorflow:loss = 1.3598224, step = 12780 (12.059 sec)
INFO:tensorflow:lr = 0.0003517854 (12.058 sec)
INFO:tensorflow:global_step/sec: 12.5836
INFO:tensorflow:loss = 1.3555378, step = 12880 (7.951 sec)
INFO:tensorflow:lr = 0.00035143204 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.7837
INFO:tensorflow:loss = 1.3521165, step = 12980 (7.819 sec)
INFO:tensorflow:lr = 0.000351079 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.7323
INFO:tensorflow:loss = 1.3695495, step = 13080 (7.859 sec)
INFO:tensorflow:lr = 0.00035072633 (7.861 sec)
INFO:tensorflow:global_step/sec: 13.0184
INFO:tensorflow:loss = 1.3140963, step = 13180 (7.676 sec)
INFO:tensorflow:lr = 0.00035037403 (7.675 sec)
INFO:tensorflow:global_step/sec: 12.6429
INFO:tensorflow:loss = 1.3322172, step = 13280 (7.910 sec)
INFO:tensorflow:lr = 0.00035002205 (7.913 sec)
INFO:tensorflow:global_step/sec: 12.6645
INFO:tensorflow:loss = 1.3830324, step = 13380 (7.901 sec)
INFO:tensorflow:lr = 0.00034967044 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.349
INFO:tensorflow:loss = 1.3274176, step = 13480 (8.093 sec)
INFO:tensorflow:lr = 0.0003493192 (8.099 sec)
INFO:tensorflow:global_step/sec: 12.8935
INFO:tensorflow:loss = 1.3599035, step = 13580 (7.758 sec)
INFO:tensorflow:lr = 0.00034896831 (7.753 sec)
INFO:tensorflow:global_step/sec: 12.5766
INFO:tensorflow:loss = 1.3469765, step = 13680 (7.953 sec)
INFO:tensorflow:lr = 0.00034861776 (7.953 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.4964
INFO:tensorflow:loss = 1.3144921, step = 13780 (11.765 sec)
INFO:tensorflow:lr = 0.00034826755 (11.764 sec)
INFO:tensorflow:global_step/sec: 12.4808
INFO:tensorflow:loss = 1.4038187, step = 13880 (8.014 sec)
INFO:tensorflow:lr = 0.00034791772 (8.016 sec)
INFO:tensorflow:global_step/sec: 12.8326
INFO:tensorflow:loss = 1.3301687, step = 13980 (7.792 sec)
INFO:tensorflow:lr = 0.00034756822 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.692
INFO:tensorflow:loss = 1.3259747, step = 14080 (7.882 sec)
INFO:tensorflow:lr = 0.0003472191 (7.882 sec)
INFO:tensorflow:global_step/sec: 12.7396
INFO:tensorflow:loss = 1.3204691, step = 14180 (7.846 sec)
INFO:tensorflow:lr = 0.0003468703 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.5856
INFO:tensorflow:loss = 1.3055412, step = 14280 (7.946 sec)
INFO:tensorflow:lr = 0.00034652182 (7.943 sec)
INFO:tensorflow:global_step/sec: 12.639
INFO:tensorflow:loss = 1.3440651, step = 14380 (7.917 sec)
INFO:tensorflow:lr = 0.00034617377 (7.916 sec)
INFO:tensorflow:global_step/sec: 12.5423
INFO:tensorflow:loss = 1.3381974, step = 14480 (7.967 sec)
INFO:tensorflow:lr = 0.000345826 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.6293
INFO:tensorflow:loss = 1.3422388, step = 14580 (7.921 sec)
INFO:tensorflow:lr = 0.00034547862 (7.921 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.63617
INFO:tensorflow:loss = 1.3256061, step = 14680 (11.581 sec)
INFO:tensorflow:lr = 0.0003451316 (11.581 sec)
INFO:tensorflow:global_step/sec: 13.0441
INFO:tensorflow:loss = 1.3087891, step = 14780 (7.665 sec)
INFO:tensorflow:lr = 0.00034478487 (7.664 sec)
INFO:tensorflow:global_step/sec: 12.7367
INFO:tensorflow:loss = 1.343419, step = 14880 (7.853 sec)
INFO:tensorflow:lr = 0.00034443854 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.7033
INFO:tensorflow:loss = 1.3251257, step = 14980 (7.869 sec)
INFO:tensorflow:lr = 0.00034409255 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.6804
INFO:tensorflow:loss = 1.34874, step = 15080 (7.890 sec)
INFO:tensorflow:lr = 0.00034374685 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.414
INFO:tensorflow:loss = 1.3258908, step = 15180 (8.049 sec)
INFO:tensorflow:lr = 0.00034340157 (8.050 sec)
INFO:tensorflow:global_step/sec: 13.0191
INFO:tensorflow:loss = 1.331736, step = 15280 (7.681 sec)
INFO:tensorflow:lr = 0.00034305663 (7.684 sec)
INFO:tensorflow:global_step/sec: 12.7453
INFO:tensorflow:loss = 1.3291036, step = 15380 (7.851 sec)
INFO:tensorflow:lr = 0.000342712 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.5726
INFO:tensorflow:loss = 1.360546, step = 15480 (7.955 sec)
INFO:tensorflow:lr = 0.00034236774 (7.955 sec)
INFO:tensorflow:global_step/sec: 12.4596
INFO:tensorflow:loss = 1.3105683, step = 15580 (8.021 sec)
INFO:tensorflow:lr = 0.00034202382 (8.021 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.10404
INFO:tensorflow:loss = 1.306641, step = 15680 (10.988 sec)
INFO:tensorflow:lr = 0.00034168025 (10.990 sec)
INFO:tensorflow:global_step/sec: 12.6049
INFO:tensorflow:loss = 1.3161285, step = 15780 (7.932 sec)
INFO:tensorflow:lr = 0.00034133703 (7.931 sec)
INFO:tensorflow:global_step/sec: 13.1158
INFO:tensorflow:loss = 1.331718, step = 15880 (7.627 sec)
INFO:tensorflow:lr = 0.00034099416 (7.627 sec)
INFO:tensorflow:global_step/sec: 12.7958
INFO:tensorflow:loss = 1.3309196, step = 15980 (7.811 sec)
INFO:tensorflow:lr = 0.00034065163 (7.810 sec)
INFO:tensorflow:global_step/sec: 12.8154
INFO:tensorflow:loss = 1.3363672, step = 16080 (7.803 sec)
INFO:tensorflow:lr = 0.00034030943 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.8214
INFO:tensorflow:loss = 1.3402402, step = 16180 (7.803 sec)
INFO:tensorflow:lr = 0.00033996755 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.845
INFO:tensorflow:loss = 1.3548362, step = 16280 (7.784 sec)
INFO:tensorflow:lr = 0.00033962607 (7.785 sec)
INFO:tensorflow:global_step/sec: 12.3373
INFO:tensorflow:loss = 1.3413169, step = 16380 (8.103 sec)
INFO:tensorflow:lr = 0.0003392849 (8.102 sec)
INFO:tensorflow:global_step/sec: 12.5631
INFO:tensorflow:loss = 1.3316003, step = 16480 (7.964 sec)
INFO:tensorflow:lr = 0.00033894408 (7.964 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1431
INFO:tensorflow:loss = 1.3373045, step = 16580 (8.238 sec)
INFO:tensorflow:lr = 0.0003386036 (8.244 sec)
INFO:tensorflow:global_step/sec: 10.6592
INFO:tensorflow:loss = 1.3188674, step = 16680 (9.380 sec)
INFO:tensorflow:lr = 0.00033826346 (9.374 sec)
INFO:tensorflow:global_step/sec: 12.777
INFO:tensorflow:loss = 1.2873152, step = 16780 (7.825 sec)
INFO:tensorflow:lr = 0.00033792367 (7.825 sec)
INFO:tensorflow:global_step/sec: 12.5919
INFO:tensorflow:loss = 1.3186045, step = 16880 (7.937 sec)
INFO:tensorflow:lr = 0.00033758424 (7.937 sec)
INFO:tensorflow:global_step/sec: 12.728
INFO:tensorflow:loss = 1.3294945, step = 16980 (7.857 sec)
INFO:tensorflow:lr = 0.0003372451 (7.857 sec)
INFO:tensorflow:global_step/sec: 12.9323
INFO:tensorflow:loss = 1.3417977, step = 17080 (7.738 sec)
INFO:tensorflow:lr = 0.00033690632 (7.738 sec)
INFO:tensorflow:global_step/sec: 12.7768
INFO:tensorflow:loss = 1.3123543, step = 17180 (7.826 sec)
INFO:tensorflow:lr = 0.0003365679 (7.825 sec)
INFO:tensorflow:global_step/sec: 12.7613
INFO:tensorflow:loss = 1.319809, step = 17280 (7.834 sec)
INFO:tensorflow:lr = 0.0003362298 (7.834 sec)
INFO:tensorflow:global_step/sec: 12.5586
INFO:tensorflow:loss = 1.31707, step = 17380 (7.961 sec)
INFO:tensorflow:lr = 0.00033589205 (7.961 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5363
INFO:tensorflow:loss = 1.3020943, step = 17480 (7.982 sec)
INFO:tensorflow:lr = 0.00033555465 (7.984 sec)
INFO:tensorflow:global_step/sec: 10.9413
INFO:tensorflow:loss = 1.3228619, step = 17580 (9.138 sec)
INFO:tensorflow:lr = 0.00033521757 (9.137 sec)
INFO:tensorflow:global_step/sec: 12.6287
INFO:tensorflow:loss = 1.3076676, step = 17680 (7.919 sec)
INFO:tensorflow:lr = 0.00033488084 (7.918 sec)
INFO:tensorflow:global_step/sec: 12.7388
INFO:tensorflow:loss = 1.301673, step = 17780 (7.849 sec)
INFO:tensorflow:lr = 0.0003345444 (7.850 sec)
INFO:tensorflow:global_step/sec: 12.7397
INFO:tensorflow:loss = 1.3108275, step = 17880 (7.846 sec)
INFO:tensorflow:lr = 0.00033420837 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.7183
INFO:tensorflow:loss = 1.3072705, step = 17980 (7.865 sec)
INFO:tensorflow:lr = 0.00033387265 (7.867 sec)
INFO:tensorflow:global_step/sec: 12.823
INFO:tensorflow:loss = 1.3254036, step = 18080 (7.801 sec)
INFO:tensorflow:lr = 0.00033353726 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.1744
INFO:tensorflow:loss = 1.299603, step = 18180 (8.208 sec)
INFO:tensorflow:lr = 0.00033320222 (8.208 sec)
INFO:tensorflow:global_step/sec: 12.6291
INFO:tensorflow:loss = 1.3302066, step = 18280 (7.918 sec)
INFO:tensorflow:lr = 0.0003328675 (7.917 sec)
INFO:tensorflow:global_step/sec: 12.6967
INFO:tensorflow:loss = 1.318776, step = 18380 (7.879 sec)
INFO:tensorflow:lr = 0.00033253315 (7.881 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.8313
INFO:tensorflow:loss = 1.2908607, step = 18480 (8.451 sec)
INFO:tensorflow:lr = 0.00033219912 (8.454 sec)
INFO:tensorflow:global_step/sec: 11.3725
INFO:tensorflow:loss = 1.3153081, step = 18580 (8.796 sec)
INFO:tensorflow:lr = 0.0003318654 (8.792 sec)
INFO:tensorflow:global_step/sec: 12.7336
INFO:tensorflow:loss = 1.3217913, step = 18680 (7.853 sec)
INFO:tensorflow:lr = 0.00033153204 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.6533
INFO:tensorflow:loss = 1.3215, step = 18780 (7.904 sec)
INFO:tensorflow:lr = 0.00033119903 (7.905 sec)
INFO:tensorflow:global_step/sec: 12.4503
INFO:tensorflow:loss = 1.3031405, step = 18880 (8.031 sec)
INFO:tensorflow:lr = 0.00033086629 (8.031 sec)
INFO:tensorflow:global_step/sec: 12.6567
INFO:tensorflow:loss = 1.2904049, step = 18980 (7.896 sec)
INFO:tensorflow:lr = 0.00033053392 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.6398
INFO:tensorflow:loss = 1.3116907, step = 19080 (7.912 sec)
INFO:tensorflow:lr = 0.00033020187 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.6908
INFO:tensorflow:loss = 1.3194084, step = 19180 (7.883 sec)
INFO:tensorflow:lr = 0.00032987018 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.8419
INFO:tensorflow:loss = 1.3328631, step = 19280 (7.784 sec)
INFO:tensorflow:lr = 0.00032953883 (7.784 sec)
INFO:tensorflow:global_step/sec: 13.1392
INFO:tensorflow:loss = 1.3144226, step = 19380 (7.611 sec)
INFO:tensorflow:lr = 0.0003292078 (7.611 sec)
INFO:tensorflow:global_step/sec: 12.6009
INFO:tensorflow:loss = 1.3241731, step = 19480 (7.936 sec)
INFO:tensorflow:lr = 0.0003288771 (7.936 sec)
INFO:tensorflow:Saving checkpoints for 19560 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.3418434.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-19560
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ]

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-19560
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.664
INFO:tensorflow:Best (Exact Match) Accuracy: 0.664
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-19560
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 19560 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.3048319, step = 19560
INFO:tensorflow:lr = 0.00032861278
INFO:tensorflow:global_step/sec: 10.2833
INFO:tensorflow:loss = 1.312456, step = 19660 (9.729 sec)
INFO:tensorflow:lr = 0.00032828268 (9.725 sec)
INFO:tensorflow:global_step/sec: 12.8592
INFO:tensorflow:loss = 1.3122357, step = 19760 (7.778 sec)
INFO:tensorflow:lr = 0.00032795293 (7.776 sec)
INFO:tensorflow:global_step/sec: 12.5629
INFO:tensorflow:loss = 1.315895, step = 19860 (7.960 sec)
INFO:tensorflow:lr = 0.00032762348 (7.959 sec)
INFO:tensorflow:global_step/sec: 12.982
INFO:tensorflow:loss = 1.2998242, step = 19960 (7.703 sec)
INFO:tensorflow:lr = 0.00032729437 (7.703 sec)
INFO:tensorflow:global_step/sec: 12.8239
INFO:tensorflow:loss = 1.3176674, step = 20060 (7.797 sec)
INFO:tensorflow:lr = 0.00032696562 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.4351
INFO:tensorflow:loss = 1.2875775, step = 20160 (8.039 sec)
INFO:tensorflow:lr = 0.00032663712 (8.042 sec)
INFO:tensorflow:global_step/sec: 12.6837
INFO:tensorflow:loss = 1.2956387, step = 20260 (7.884 sec)
INFO:tensorflow:lr = 0.000326309 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.5531
INFO:tensorflow:loss = 1.3311186, step = 20360 (7.969 sec)
INFO:tensorflow:lr = 0.00032598124 (7.968 sec)
INFO:tensorflow:global_step/sec: 12.5652
INFO:tensorflow:loss = 1.3361937, step = 20460 (7.956 sec)
INFO:tensorflow:lr = 0.0003256538 (7.955 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.18867
INFO:tensorflow:loss = 1.3309901, step = 20560 (12.216 sec)
INFO:tensorflow:lr = 0.00032532666 (12.223 sec)
INFO:tensorflow:global_step/sec: 12.6948
INFO:tensorflow:loss = 1.3054596, step = 20660 (7.873 sec)
INFO:tensorflow:lr = 0.00032499988 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.5301
INFO:tensorflow:loss = 1.2792804, step = 20760 (7.981 sec)
INFO:tensorflow:lr = 0.0003246734 (7.985 sec)
INFO:tensorflow:global_step/sec: 12.663
INFO:tensorflow:loss = 1.3026924, step = 20860 (7.897 sec)
INFO:tensorflow:lr = 0.00032434726 (7.895 sec)
INFO:tensorflow:global_step/sec: 12.7051
INFO:tensorflow:loss = 1.358359, step = 20960 (7.876 sec)
INFO:tensorflow:lr = 0.00032402144 (7.874 sec)
INFO:tensorflow:global_step/sec: 12.7735
INFO:tensorflow:loss = 1.3020449, step = 21060 (7.823 sec)
INFO:tensorflow:lr = 0.00032369597 (7.823 sec)
INFO:tensorflow:global_step/sec: 13.1674
INFO:tensorflow:loss = 1.3003097, step = 21160 (7.595 sec)
INFO:tensorflow:lr = 0.00032337077 (7.595 sec)
INFO:tensorflow:global_step/sec: 12.728
INFO:tensorflow:loss = 1.2887429, step = 21260 (7.863 sec)
INFO:tensorflow:lr = 0.00032304594 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.7174
INFO:tensorflow:loss = 1.3302351, step = 21360 (7.857 sec)
INFO:tensorflow:lr = 0.00032272143 (7.860 sec)
INFO:tensorflow:global_step/sec: 12.7107
INFO:tensorflow:loss = 1.3106179, step = 21460 (7.867 sec)
INFO:tensorflow:lr = 0.00032239725 (7.864 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.24138
INFO:tensorflow:loss = 1.2837156, step = 21560 (12.140 sec)
INFO:tensorflow:lr = 0.0003220734 (12.140 sec)
INFO:tensorflow:global_step/sec: 13.0831
INFO:tensorflow:loss = 1.3228761, step = 21660 (7.645 sec)
INFO:tensorflow:lr = 0.00032174986 (7.644 sec)
INFO:tensorflow:global_step/sec: 12.8614
INFO:tensorflow:loss = 1.312087, step = 21760 (7.773 sec)
INFO:tensorflow:lr = 0.00032142666 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.7587
INFO:tensorflow:loss = 1.3115535, step = 21860 (7.835 sec)
INFO:tensorflow:lr = 0.00032110378 (7.834 sec)
INFO:tensorflow:global_step/sec: 12.4595
INFO:tensorflow:loss = 1.2954695, step = 21960 (8.028 sec)
INFO:tensorflow:lr = 0.00032078126 (8.029 sec)
INFO:tensorflow:global_step/sec: 12.8623
INFO:tensorflow:loss = 1.2953963, step = 22060 (7.773 sec)
INFO:tensorflow:lr = 0.000320459 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.7449
INFO:tensorflow:loss = 1.3128618, step = 22160 (7.843 sec)
INFO:tensorflow:lr = 0.00032013707 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.622
INFO:tensorflow:loss = 1.3067259, step = 22260 (7.925 sec)
INFO:tensorflow:lr = 0.00031981547 (7.921 sec)
INFO:tensorflow:global_step/sec: 12.5084
INFO:tensorflow:loss = 1.3142986, step = 22360 (7.993 sec)
INFO:tensorflow:lr = 0.00031949423 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.831
INFO:tensorflow:loss = 1.3074307, step = 22460 (7.793 sec)
INFO:tensorflow:lr = 0.00031917327 (7.792 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.2055
INFO:tensorflow:loss = 1.2916995, step = 22560 (12.186 sec)
INFO:tensorflow:lr = 0.0003188527 (12.189 sec)
INFO:tensorflow:global_step/sec: 12.8634
INFO:tensorflow:loss = 1.2907739, step = 22660 (7.779 sec)
INFO:tensorflow:lr = 0.00031853237 (7.777 sec)
INFO:tensorflow:global_step/sec: 12.8974
INFO:tensorflow:loss = 1.2921684, step = 22760 (7.755 sec)
INFO:tensorflow:lr = 0.0003182124 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.7443
INFO:tensorflow:loss = 1.2923056, step = 22860 (7.844 sec)
INFO:tensorflow:lr = 0.00031789276 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.6921
INFO:tensorflow:loss = 1.2913071, step = 22960 (7.875 sec)
INFO:tensorflow:lr = 0.00031757343 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.6585
INFO:tensorflow:loss = 1.2972944, step = 23060 (7.902 sec)
INFO:tensorflow:lr = 0.0003172544 (7.903 sec)
INFO:tensorflow:global_step/sec: 12.8911
INFO:tensorflow:loss = 1.28654, step = 23160 (7.756 sec)
INFO:tensorflow:lr = 0.0003169357 (7.755 sec)
INFO:tensorflow:global_step/sec: 12.6817
INFO:tensorflow:loss = 1.3095835, step = 23260 (7.889 sec)
INFO:tensorflow:lr = 0.00031661734 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.514
INFO:tensorflow:loss = 1.3168696, step = 23360 (7.989 sec)
INFO:tensorflow:lr = 0.0003162993 (7.989 sec)
INFO:tensorflow:global_step/sec: 12.7126
INFO:tensorflow:loss = 1.2910316, step = 23460 (7.864 sec)
INFO:tensorflow:lr = 0.00031598154 (7.863 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.40655
INFO:tensorflow:loss = 1.2932509, step = 23560 (11.898 sec)
INFO:tensorflow:lr = 0.00031566413 (11.898 sec)
INFO:tensorflow:global_step/sec: 12.81
INFO:tensorflow:loss = 1.2906524, step = 23660 (7.808 sec)
INFO:tensorflow:lr = 0.00031534708 (7.809 sec)
INFO:tensorflow:global_step/sec: 13.0227
INFO:tensorflow:loss = 1.2930197, step = 23760 (7.675 sec)
INFO:tensorflow:lr = 0.00031503028 (7.678 sec)
INFO:tensorflow:global_step/sec: 12.5006
INFO:tensorflow:loss = 1.3265917, step = 23860 (7.999 sec)
INFO:tensorflow:lr = 0.0003147138 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.707
INFO:tensorflow:loss = 1.2934457, step = 23960 (7.870 sec)
INFO:tensorflow:lr = 0.00031439765 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.3301
INFO:tensorflow:loss = 1.303881, step = 24060 (8.110 sec)
INFO:tensorflow:lr = 0.00031408184 (8.110 sec)
INFO:tensorflow:global_step/sec: 12.8441
INFO:tensorflow:loss = 1.3020984, step = 24160 (7.789 sec)
INFO:tensorflow:lr = 0.00031376636 (7.790 sec)
INFO:tensorflow:global_step/sec: 12.703
INFO:tensorflow:loss = 1.3089213, step = 24260 (7.869 sec)
INFO:tensorflow:lr = 0.00031345116 (7.871 sec)
INFO:tensorflow:global_step/sec: 12.6076
INFO:tensorflow:loss = 1.2835792, step = 24360 (7.932 sec)
INFO:tensorflow:lr = 0.0003131363 (7.930 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.6078
INFO:tensorflow:loss = 1.30011, step = 24460 (11.617 sec)
INFO:tensorflow:lr = 0.00031282174 (11.619 sec)
INFO:tensorflow:global_step/sec: 12.8552
INFO:tensorflow:loss = 1.2753806, step = 24560 (7.786 sec)
INFO:tensorflow:lr = 0.0003125075 (7.783 sec)
INFO:tensorflow:global_step/sec: 12.3914
INFO:tensorflow:loss = 1.2902484, step = 24660 (8.063 sec)
INFO:tensorflow:lr = 0.0003121936 (8.063 sec)
INFO:tensorflow:global_step/sec: 12.7618
INFO:tensorflow:loss = 1.3047645, step = 24760 (7.836 sec)
INFO:tensorflow:lr = 0.00031188 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.8865
INFO:tensorflow:loss = 1.2961329, step = 24860 (7.767 sec)
INFO:tensorflow:lr = 0.0003115667 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.9008
INFO:tensorflow:loss = 1.2774085, step = 24960 (7.748 sec)
INFO:tensorflow:lr = 0.0003112537 (7.749 sec)
INFO:tensorflow:global_step/sec: 12.804
INFO:tensorflow:loss = 1.2744296, step = 25060 (7.810 sec)
INFO:tensorflow:lr = 0.00031094105 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.8994
INFO:tensorflow:loss = 1.299216, step = 25160 (7.749 sec)
INFO:tensorflow:lr = 0.0003106287 (7.748 sec)
INFO:tensorflow:global_step/sec: 12.8665
INFO:tensorflow:loss = 1.2802867, step = 25260 (7.776 sec)
INFO:tensorflow:lr = 0.00031031665 (7.777 sec)
INFO:tensorflow:global_step/sec: 12.7289
INFO:tensorflow:loss = 1.3002493, step = 25360 (7.857 sec)
INFO:tensorflow:lr = 0.00031000495 (7.855 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.09796
INFO:tensorflow:loss = 1.315465, step = 25460 (10.988 sec)
INFO:tensorflow:lr = 0.00030969354 (10.988 sec)
INFO:tensorflow:global_step/sec: 12.8865
INFO:tensorflow:loss = 1.2996613, step = 25560 (7.759 sec)
INFO:tensorflow:lr = 0.00030938242 (7.765 sec)
INFO:tensorflow:global_step/sec: 12.6831
INFO:tensorflow:loss = 1.2841055, step = 25660 (7.888 sec)
INFO:tensorflow:lr = 0.00030907162 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.9739
INFO:tensorflow:loss = 1.2864649, step = 25760 (7.708 sec)
INFO:tensorflow:lr = 0.00030876117 (7.708 sec)
INFO:tensorflow:global_step/sec: 12.7143
INFO:tensorflow:loss = 1.2838994, step = 25860 (7.866 sec)
INFO:tensorflow:lr = 0.000308451 (7.866 sec)
INFO:tensorflow:global_step/sec: 13.0226
INFO:tensorflow:loss = 1.2848786, step = 25960 (7.674 sec)
INFO:tensorflow:lr = 0.00030814117 (7.675 sec)
INFO:tensorflow:global_step/sec: 12.8533
INFO:tensorflow:loss = 1.2814575, step = 26060 (7.780 sec)
INFO:tensorflow:lr = 0.00030783165 (7.781 sec)
INFO:tensorflow:global_step/sec: 12.5923
INFO:tensorflow:loss = 1.2896702, step = 26160 (7.941 sec)
INFO:tensorflow:lr = 0.0003075224 (7.943 sec)
INFO:tensorflow:global_step/sec: 12.7118
INFO:tensorflow:loss = 1.2936949, step = 26260 (7.871 sec)
INFO:tensorflow:lr = 0.00030721352 (7.868 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1137
INFO:tensorflow:loss = 1.2839646, step = 26360 (8.256 sec)
INFO:tensorflow:lr = 0.0003069049 (8.256 sec)
INFO:tensorflow:global_step/sec: 10.4227
INFO:tensorflow:loss = 1.2964764, step = 26460 (9.589 sec)
INFO:tensorflow:lr = 0.0003065966 (9.591 sec)
INFO:tensorflow:global_step/sec: 12.6315
INFO:tensorflow:loss = 1.2799263, step = 26560 (7.921 sec)
INFO:tensorflow:lr = 0.0003062886 (7.919 sec)
INFO:tensorflow:global_step/sec: 12.813
INFO:tensorflow:loss = 1.2930382, step = 26660 (7.801 sec)
INFO:tensorflow:lr = 0.00030598094 (7.802 sec)
INFO:tensorflow:global_step/sec: 12.7167
INFO:tensorflow:loss = 1.2775872, step = 26760 (7.863 sec)
INFO:tensorflow:lr = 0.00030567357 (7.862 sec)
INFO:tensorflow:global_step/sec: 12.5424
INFO:tensorflow:loss = 1.2938052, step = 26860 (7.977 sec)
INFO:tensorflow:lr = 0.0003053665 (7.977 sec)
INFO:tensorflow:global_step/sec: 12.9605
INFO:tensorflow:loss = 1.3075194, step = 26960 (7.711 sec)
INFO:tensorflow:lr = 0.00030505977 (7.711 sec)
INFO:tensorflow:global_step/sec: 12.644
INFO:tensorflow:loss = 1.2937547, step = 27060 (7.909 sec)
INFO:tensorflow:lr = 0.0003047533 (7.910 sec)
INFO:tensorflow:global_step/sec: 13.0595
INFO:tensorflow:loss = 1.3111972, step = 27160 (7.662 sec)
INFO:tensorflow:lr = 0.0003044472 (7.662 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5976
INFO:tensorflow:loss = 1.2813871, step = 27260 (7.937 sec)
INFO:tensorflow:lr = 0.00030414137 (7.938 sec)
INFO:tensorflow:global_step/sec: 10.8542
INFO:tensorflow:loss = 1.2741573, step = 27360 (9.215 sec)
INFO:tensorflow:lr = 0.00030383587 (9.214 sec)
INFO:tensorflow:global_step/sec: 12.9826
INFO:tensorflow:loss = 1.2877482, step = 27460 (7.701 sec)
INFO:tensorflow:lr = 0.00030353063 (7.701 sec)
INFO:tensorflow:global_step/sec: 12.439
INFO:tensorflow:loss = 1.2878534, step = 27560 (8.035 sec)
INFO:tensorflow:lr = 0.0003032257 (8.036 sec)
INFO:tensorflow:global_step/sec: 12.477
INFO:tensorflow:loss = 1.2885484, step = 27660 (8.014 sec)
INFO:tensorflow:lr = 0.0003029211 (8.013 sec)
INFO:tensorflow:global_step/sec: 12.4905
INFO:tensorflow:loss = 1.2796994, step = 27760 (8.006 sec)
INFO:tensorflow:lr = 0.00030261683 (8.006 sec)
INFO:tensorflow:global_step/sec: 12.8284
INFO:tensorflow:loss = 1.2923272, step = 27860 (7.799 sec)
INFO:tensorflow:lr = 0.00030231284 (7.802 sec)
INFO:tensorflow:global_step/sec: 12.7148
INFO:tensorflow:loss = 1.2721691, step = 27960 (7.866 sec)
INFO:tensorflow:lr = 0.00030200917 (7.864 sec)
INFO:tensorflow:global_step/sec: 12.9207
INFO:tensorflow:loss = 1.2802061, step = 28060 (7.739 sec)
INFO:tensorflow:lr = 0.0003017058 (7.738 sec)
INFO:tensorflow:global_step/sec: 12.7999
INFO:tensorflow:loss = 1.2846918, step = 28160 (7.813 sec)
INFO:tensorflow:lr = 0.00030140273 (7.813 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.8178
INFO:tensorflow:loss = 1.2896069, step = 28260 (8.461 sec)
INFO:tensorflow:lr = 0.00030109996 (8.461 sec)
INFO:tensorflow:global_step/sec: 11.4031
INFO:tensorflow:loss = 1.2732713, step = 28360 (8.769 sec)
INFO:tensorflow:lr = 0.0003007975 (8.769 sec)
INFO:tensorflow:global_step/sec: 12.6608
INFO:tensorflow:loss = 1.2760838, step = 28460 (7.895 sec)
INFO:tensorflow:lr = 0.00030049533 (7.900 sec)
INFO:tensorflow:global_step/sec: 12.5912
INFO:tensorflow:loss = 1.285021, step = 28560 (7.944 sec)
INFO:tensorflow:lr = 0.00030019347 (7.939 sec)
INFO:tensorflow:global_step/sec: 12.6283
INFO:tensorflow:loss = 1.2831901, step = 28660 (7.922 sec)
INFO:tensorflow:lr = 0.00029989192 (7.922 sec)
INFO:tensorflow:global_step/sec: 12.5436
INFO:tensorflow:loss = 1.2798933, step = 28760 (7.970 sec)
INFO:tensorflow:lr = 0.00029959064 (7.970 sec)
INFO:tensorflow:global_step/sec: 12.9383
INFO:tensorflow:loss = 1.2905648, step = 28860 (7.730 sec)
INFO:tensorflow:lr = 0.0002992897 (7.730 sec)
INFO:tensorflow:global_step/sec: 13.0137
INFO:tensorflow:loss = 1.2883794, step = 28960 (7.680 sec)
INFO:tensorflow:lr = 0.00029898906 (7.680 sec)
INFO:tensorflow:global_step/sec: 12.8798
INFO:tensorflow:loss = 1.2834778, step = 29060 (7.764 sec)
INFO:tensorflow:lr = 0.00029868874 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.8779
INFO:tensorflow:loss = 1.2783784, step = 29160 (7.765 sec)
INFO:tensorflow:lr = 0.00029838865 (7.770 sec)
INFO:tensorflow:global_step/sec: 12.7015
INFO:tensorflow:loss = 1.2855964, step = 29260 (7.874 sec)
INFO:tensorflow:lr = 0.00029808894 (7.877 sec)
INFO:tensorflow:Saving checkpoints for 29340 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.302846.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-29340
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-29340
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.702
INFO:tensorflow:Best (Exact Match) Accuracy: 0.702
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-29340
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 29340 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2902774, step = 29340
INFO:tensorflow:lr = 0.0002978494
INFO:tensorflow:global_step/sec: 10.3227
INFO:tensorflow:loss = 1.3032885, step = 29440 (9.692 sec)
INFO:tensorflow:lr = 0.0002975502 (9.693 sec)
INFO:tensorflow:global_step/sec: 12.3379
INFO:tensorflow:loss = 1.2751992, step = 29540 (8.106 sec)
INFO:tensorflow:lr = 0.0002972513 (8.105 sec)
INFO:tensorflow:global_step/sec: 12.8195
INFO:tensorflow:loss = 1.2912132, step = 29640 (7.800 sec)
INFO:tensorflow:lr = 0.0002969527 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.4392
INFO:tensorflow:loss = 1.2732567, step = 29740 (8.036 sec)
INFO:tensorflow:lr = 0.00029665435 (8.039 sec)
INFO:tensorflow:global_step/sec: 12.5569
INFO:tensorflow:loss = 1.2769362, step = 29840 (7.967 sec)
INFO:tensorflow:lr = 0.0002963564 (7.966 sec)
INFO:tensorflow:global_step/sec: 12.9836
INFO:tensorflow:loss = 1.2793033, step = 29940 (7.699 sec)
INFO:tensorflow:lr = 0.00029605866 (7.702 sec)
INFO:tensorflow:global_step/sec: 12.5844
INFO:tensorflow:loss = 1.2748176, step = 30040 (7.947 sec)
INFO:tensorflow:lr = 0.0002957613 (7.943 sec)
INFO:tensorflow:global_step/sec: 12.7121
INFO:tensorflow:loss = 1.2927984, step = 30140 (7.866 sec)
INFO:tensorflow:lr = 0.00029546418 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.6349
INFO:tensorflow:loss = 1.2704685, step = 30240 (7.915 sec)
INFO:tensorflow:lr = 0.00029516738 (7.913 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.30175
INFO:tensorflow:loss = 1.2709056, step = 30340 (12.049 sec)
INFO:tensorflow:lr = 0.0002948709 (12.050 sec)
INFO:tensorflow:global_step/sec: 12.6638
INFO:tensorflow:loss = 1.2773079, step = 30440 (7.898 sec)
INFO:tensorflow:lr = 0.00029457468 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.4741
INFO:tensorflow:loss = 1.2764441, step = 30540 (8.016 sec)
INFO:tensorflow:lr = 0.00029427878 (8.018 sec)
INFO:tensorflow:global_step/sec: 12.7293
INFO:tensorflow:loss = 1.2704064, step = 30640 (7.857 sec)
INFO:tensorflow:lr = 0.00029398318 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.6686
INFO:tensorflow:loss = 1.2712173, step = 30740 (7.893 sec)
INFO:tensorflow:lr = 0.00029368783 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.7314
INFO:tensorflow:loss = 1.3050127, step = 30840 (7.851 sec)
INFO:tensorflow:lr = 0.0002933928 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.8834
INFO:tensorflow:loss = 1.2784503, step = 30940 (7.765 sec)
INFO:tensorflow:lr = 0.0002930981 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.88
INFO:tensorflow:loss = 1.2874303, step = 31040 (7.764 sec)
INFO:tensorflow:lr = 0.00029280368 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.9115
INFO:tensorflow:loss = 1.2781101, step = 31140 (7.746 sec)
INFO:tensorflow:lr = 0.00029250956 (7.746 sec)
INFO:tensorflow:global_step/sec: 12.6392
INFO:tensorflow:loss = 1.2868813, step = 31240 (7.911 sec)
INFO:tensorflow:lr = 0.00029221573 (7.913 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.37144
INFO:tensorflow:loss = 1.2743399, step = 31340 (11.942 sec)
INFO:tensorflow:lr = 0.0002919222 (11.940 sec)
INFO:tensorflow:global_step/sec: 12.4837
INFO:tensorflow:loss = 1.2944267, step = 31440 (8.010 sec)
INFO:tensorflow:lr = 0.00029162894 (8.011 sec)
INFO:tensorflow:global_step/sec: 12.7212
INFO:tensorflow:loss = 1.3041955, step = 31540 (7.865 sec)
INFO:tensorflow:lr = 0.000291336 (7.864 sec)
INFO:tensorflow:global_step/sec: 12.9116
INFO:tensorflow:loss = 1.27363, step = 31640 (7.741 sec)
INFO:tensorflow:lr = 0.00029104334 (7.742 sec)
INFO:tensorflow:global_step/sec: 12.7415
INFO:tensorflow:loss = 1.3110542, step = 31740 (7.853 sec)
INFO:tensorflow:lr = 0.00029075096 (7.852 sec)
INFO:tensorflow:global_step/sec: 13.0078
INFO:tensorflow:loss = 1.2707573, step = 31840 (7.687 sec)
INFO:tensorflow:lr = 0.00029045888 (7.686 sec)
INFO:tensorflow:global_step/sec: 12.6669
INFO:tensorflow:loss = 1.2790074, step = 31940 (7.896 sec)
INFO:tensorflow:lr = 0.00029016714 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.9049
INFO:tensorflow:loss = 1.27734, step = 32040 (7.748 sec)
INFO:tensorflow:lr = 0.00028987564 (7.748 sec)
INFO:tensorflow:global_step/sec: 12.6828
INFO:tensorflow:loss = 1.2766548, step = 32140 (7.881 sec)
INFO:tensorflow:lr = 0.00028958445 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.6536
INFO:tensorflow:loss = 1.270347, step = 32240 (7.904 sec)
INFO:tensorflow:lr = 0.00028929356 (7.903 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.34015
INFO:tensorflow:loss = 1.2706623, step = 32340 (11.991 sec)
INFO:tensorflow:lr = 0.00028900296 (11.991 sec)
INFO:tensorflow:global_step/sec: 12.6105
INFO:tensorflow:loss = 1.2677004, step = 32440 (7.932 sec)
INFO:tensorflow:lr = 0.00028871265 (7.933 sec)
INFO:tensorflow:global_step/sec: 12.8231
INFO:tensorflow:loss = 1.2773702, step = 32540 (7.795 sec)
INFO:tensorflow:lr = 0.00028842266 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.9974
INFO:tensorflow:loss = 1.2898613, step = 32640 (7.699 sec)
INFO:tensorflow:lr = 0.0002881329 (7.695 sec)
INFO:tensorflow:global_step/sec: 12.4858
INFO:tensorflow:loss = 1.2836853, step = 32740 (8.008 sec)
INFO:tensorflow:lr = 0.00028784346 (8.008 sec)
INFO:tensorflow:global_step/sec: 12.8931
INFO:tensorflow:loss = 1.2881771, step = 32840 (7.751 sec)
INFO:tensorflow:lr = 0.00028755434 (7.752 sec)
INFO:tensorflow:global_step/sec: 12.819
INFO:tensorflow:loss = 1.276155, step = 32940 (7.801 sec)
INFO:tensorflow:lr = 0.00028726546 (7.801 sec)
INFO:tensorflow:global_step/sec: 12.7679
INFO:tensorflow:loss = 1.3059559, step = 33040 (7.833 sec)
INFO:tensorflow:lr = 0.0002869769 (7.832 sec)
INFO:tensorflow:global_step/sec: 12.8372
INFO:tensorflow:loss = 1.2818044, step = 33140 (7.793 sec)
INFO:tensorflow:lr = 0.00028668862 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.6358
INFO:tensorflow:loss = 1.272675, step = 33240 (7.911 sec)
INFO:tensorflow:lr = 0.00028640064 (7.910 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.43506
INFO:tensorflow:loss = 1.2660692, step = 33340 (11.861 sec)
INFO:tensorflow:lr = 0.00028611295 (11.861 sec)
INFO:tensorflow:global_step/sec: 12.8342
INFO:tensorflow:loss = 1.274544, step = 33440 (7.791 sec)
INFO:tensorflow:lr = 0.00028582552 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.4115
INFO:tensorflow:loss = 1.282098, step = 33540 (8.055 sec)
INFO:tensorflow:lr = 0.0002855384 (8.054 sec)
INFO:tensorflow:global_step/sec: 12.8384
INFO:tensorflow:loss = 1.271896, step = 33640 (7.786 sec)
INFO:tensorflow:lr = 0.0002852516 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.7124
INFO:tensorflow:loss = 1.2689635, step = 33740 (7.871 sec)
INFO:tensorflow:lr = 0.00028496503 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.8111
INFO:tensorflow:loss = 1.2838228, step = 33840 (7.802 sec)
INFO:tensorflow:lr = 0.0002846788 (7.802 sec)
INFO:tensorflow:global_step/sec: 12.779
INFO:tensorflow:loss = 1.2770149, step = 33940 (7.825 sec)
INFO:tensorflow:lr = 0.0002843928 (7.825 sec)
INFO:tensorflow:global_step/sec: 13.0904
INFO:tensorflow:loss = 1.266436, step = 34040 (7.638 sec)
INFO:tensorflow:lr = 0.00028410714 (7.642 sec)
INFO:tensorflow:global_step/sec: 12.6556
INFO:tensorflow:loss = 1.2893338, step = 34140 (7.908 sec)
INFO:tensorflow:lr = 0.00028382175 (7.904 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.60813
INFO:tensorflow:loss = 1.2691966, step = 34240 (11.615 sec)
INFO:tensorflow:lr = 0.00028353665 (11.616 sec)
INFO:tensorflow:global_step/sec: 12.5767
INFO:tensorflow:loss = 1.2772423, step = 34340 (7.948 sec)
INFO:tensorflow:lr = 0.0002832518 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.8296
INFO:tensorflow:loss = 1.2685624, step = 34440 (7.794 sec)
INFO:tensorflow:lr = 0.00028296726 (7.794 sec)
INFO:tensorflow:global_step/sec: 12.8444
INFO:tensorflow:loss = 1.2796193, step = 34540 (7.787 sec)
INFO:tensorflow:lr = 0.000282683 (7.786 sec)
INFO:tensorflow:global_step/sec: 12.9569
INFO:tensorflow:loss = 1.2901658, step = 34640 (7.717 sec)
INFO:tensorflow:lr = 0.00028239907 (7.717 sec)
INFO:tensorflow:global_step/sec: 12.907
INFO:tensorflow:loss = 1.2649109, step = 34740 (7.754 sec)
INFO:tensorflow:lr = 0.0002821154 (7.754 sec)
INFO:tensorflow:global_step/sec: 12.8117
INFO:tensorflow:loss = 1.2722139, step = 34840 (7.804 sec)
INFO:tensorflow:lr = 0.000281832 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.7117
INFO:tensorflow:loss = 1.2853813, step = 34940 (7.862 sec)
INFO:tensorflow:lr = 0.00028154888 (7.861 sec)
INFO:tensorflow:global_step/sec: 12.6376
INFO:tensorflow:loss = 1.2778032, step = 35040 (7.915 sec)
INFO:tensorflow:lr = 0.00028126605 (7.916 sec)
INFO:tensorflow:global_step/sec: 12.8204
INFO:tensorflow:loss = 1.2695035, step = 35140 (7.799 sec)
INFO:tensorflow:lr = 0.00028098354 (7.798 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.08278
INFO:tensorflow:loss = 1.2864376, step = 35240 (11.012 sec)
INFO:tensorflow:lr = 0.00028070126 (11.012 sec)
INFO:tensorflow:global_step/sec: 12.3979
INFO:tensorflow:loss = 1.2693602, step = 35340 (8.065 sec)
INFO:tensorflow:lr = 0.0002804193 (8.068 sec)
INFO:tensorflow:global_step/sec: 12.9214
INFO:tensorflow:loss = 1.2835609, step = 35440 (7.743 sec)
INFO:tensorflow:lr = 0.0002801376 (7.740 sec)
INFO:tensorflow:global_step/sec: 12.5272
INFO:tensorflow:loss = 1.2637956, step = 35540 (7.981 sec)
INFO:tensorflow:lr = 0.0002798562 (7.981 sec)
INFO:tensorflow:global_step/sec: 12.9356
INFO:tensorflow:loss = 1.2700819, step = 35640 (7.730 sec)
INFO:tensorflow:lr = 0.00027957506 (7.730 sec)
INFO:tensorflow:global_step/sec: 12.8449
INFO:tensorflow:loss = 1.2769866, step = 35740 (7.781 sec)
INFO:tensorflow:lr = 0.0002792942 (7.781 sec)
INFO:tensorflow:global_step/sec: 12.7669
INFO:tensorflow:loss = 1.2878106, step = 35840 (7.833 sec)
INFO:tensorflow:lr = 0.00027901368 (7.834 sec)
INFO:tensorflow:global_step/sec: 12.4951
INFO:tensorflow:loss = 1.2848315, step = 35940 (8.003 sec)
INFO:tensorflow:lr = 0.00027873338 (8.003 sec)
INFO:tensorflow:global_step/sec: 12.9564
INFO:tensorflow:loss = 1.2649281, step = 36040 (7.718 sec)
INFO:tensorflow:lr = 0.0002784534 (7.717 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5196
INFO:tensorflow:loss = 1.2739855, step = 36140 (7.988 sec)
INFO:tensorflow:lr = 0.00027817365 (7.988 sec)
INFO:tensorflow:global_step/sec: 10.5621
INFO:tensorflow:loss = 1.2650766, step = 36240 (9.467 sec)
INFO:tensorflow:lr = 0.00027789423 (9.468 sec)
INFO:tensorflow:global_step/sec: 12.7425
INFO:tensorflow:loss = 1.2738944, step = 36340 (7.853 sec)
INFO:tensorflow:lr = 0.0002776151 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.5367
INFO:tensorflow:loss = 1.2752404, step = 36440 (7.974 sec)
INFO:tensorflow:lr = 0.00027733622 (7.974 sec)
INFO:tensorflow:global_step/sec: 12.9389
INFO:tensorflow:loss = 1.2804888, step = 36540 (7.727 sec)
INFO:tensorflow:lr = 0.00027705764 (7.726 sec)
INFO:tensorflow:global_step/sec: 12.625
INFO:tensorflow:loss = 1.2651876, step = 36640 (7.925 sec)
INFO:tensorflow:lr = 0.00027677935 (7.925 sec)
INFO:tensorflow:global_step/sec: 12.6561
INFO:tensorflow:loss = 1.2666996, step = 36740 (7.898 sec)
INFO:tensorflow:lr = 0.0002765013 (7.899 sec)
INFO:tensorflow:global_step/sec: 12.6222
INFO:tensorflow:loss = 1.288384, step = 36840 (7.924 sec)
INFO:tensorflow:lr = 0.00027622355 (7.923 sec)
INFO:tensorflow:global_step/sec: 12.5421
INFO:tensorflow:loss = 1.2701671, step = 36940 (7.970 sec)
INFO:tensorflow:lr = 0.00027594608 (7.972 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 13.1055
INFO:tensorflow:loss = 1.2687078, step = 37040 (7.635 sec)
INFO:tensorflow:lr = 0.00027566886 (7.636 sec)
INFO:tensorflow:global_step/sec: 11.2215
INFO:tensorflow:loss = 1.2759229, step = 37140 (8.909 sec)
INFO:tensorflow:lr = 0.00027539194 (8.908 sec)
INFO:tensorflow:global_step/sec: 12.6468
INFO:tensorflow:loss = 1.2758858, step = 37240 (7.912 sec)
INFO:tensorflow:lr = 0.0002751153 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.3398
INFO:tensorflow:loss = 1.266111, step = 37340 (8.101 sec)
INFO:tensorflow:lr = 0.00027483894 (8.101 sec)
INFO:tensorflow:global_step/sec: 12.7537
INFO:tensorflow:loss = 1.2725819, step = 37440 (7.836 sec)
INFO:tensorflow:lr = 0.00027456286 (7.837 sec)
INFO:tensorflow:global_step/sec: 13.1806
INFO:tensorflow:loss = 1.2705429, step = 37540 (7.588 sec)
INFO:tensorflow:lr = 0.00027428704 (7.586 sec)
INFO:tensorflow:global_step/sec: 13.1254
INFO:tensorflow:loss = 1.2754468, step = 37640 (7.624 sec)
INFO:tensorflow:lr = 0.00027401155 (7.625 sec)
INFO:tensorflow:global_step/sec: 12.63
INFO:tensorflow:loss = 1.2782013, step = 37740 (7.914 sec)
INFO:tensorflow:lr = 0.00027373628 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.6325
INFO:tensorflow:loss = 1.2712921, step = 37840 (7.913 sec)
INFO:tensorflow:lr = 0.0002734613 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.4989
INFO:tensorflow:loss = 1.2724797, step = 37940 (8.004 sec)
INFO:tensorflow:lr = 0.00027318663 (8.004 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.9641
INFO:tensorflow:loss = 1.2724507, step = 38040 (8.361 sec)
INFO:tensorflow:lr = 0.0002729122 (8.360 sec)
INFO:tensorflow:global_step/sec: 11.1246
INFO:tensorflow:loss = 1.2643977, step = 38140 (8.983 sec)
INFO:tensorflow:lr = 0.00027263802 (8.984 sec)
INFO:tensorflow:global_step/sec: 12.8127
INFO:tensorflow:loss = 1.2717063, step = 38240 (7.812 sec)
INFO:tensorflow:lr = 0.00027236415 (7.811 sec)
INFO:tensorflow:global_step/sec: 12.9284
INFO:tensorflow:loss = 1.2676791, step = 38340 (7.731 sec)
INFO:tensorflow:lr = 0.00027209055 (7.738 sec)
INFO:tensorflow:global_step/sec: 13.087
INFO:tensorflow:loss = 1.2721039, step = 38440 (7.644 sec)
INFO:tensorflow:lr = 0.00027181726 (7.637 sec)
INFO:tensorflow:global_step/sec: 12.8318
INFO:tensorflow:loss = 1.2676044, step = 38540 (7.788 sec)
INFO:tensorflow:lr = 0.00027154418 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.6748
INFO:tensorflow:loss = 1.2753915, step = 38640 (7.894 sec)
INFO:tensorflow:lr = 0.00027127142 (7.894 sec)
INFO:tensorflow:global_step/sec: 12.6085
INFO:tensorflow:loss = 1.2720599, step = 38740 (7.926 sec)
INFO:tensorflow:lr = 0.00027099892 (7.926 sec)
INFO:tensorflow:global_step/sec: 12.7104
INFO:tensorflow:loss = 1.2626356, step = 38840 (7.874 sec)
INFO:tensorflow:lr = 0.0002707267 (7.874 sec)
INFO:tensorflow:global_step/sec: 12.696
INFO:tensorflow:loss = 1.2689277, step = 38940 (7.874 sec)
INFO:tensorflow:lr = 0.00027045477 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.6811
INFO:tensorflow:loss = 1.2729962, step = 39040 (7.887 sec)
INFO:tensorflow:lr = 0.00027018308 (7.883 sec)
INFO:tensorflow:Saving checkpoints for 39120 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2890505.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-39120
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                                
  __________________________|_____________________________________________________________                          
 |     |    |     |                        |                                         sl:location                   
 |     |    |     |                        |                                              |                         
 |     |    |     |                        |                                       in:get_location                 
 |     |    |     |                        |                              ________________|_______________          
 |     |    |     |                 sl:category_even              sl:search_radius                 sl:location_user
 |     |    |     |                        t                             |                                |        
 |     |    |     |          ______________|_________________            |                                |         
what times are playing     the         nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-39120
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.707
INFO:tensorflow:Best (Exact Match) Accuracy: 0.707
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-39120
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 39120 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2692995, step = 39120
INFO:tensorflow:lr = 0.00026996594
INFO:tensorflow:global_step/sec: 10.423
INFO:tensorflow:loss = 1.2852095, step = 39220 (9.595 sec)
INFO:tensorflow:lr = 0.00026969475 (9.595 sec)
INFO:tensorflow:global_step/sec: 12.7697
INFO:tensorflow:loss = 1.2648714, step = 39320 (7.838 sec)
INFO:tensorflow:lr = 0.00026942385 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.4705
INFO:tensorflow:loss = 1.263199, step = 39420 (8.017 sec)
INFO:tensorflow:lr = 0.00026915318 (8.017 sec)
INFO:tensorflow:global_step/sec: 12.5405
INFO:tensorflow:loss = 1.2712208, step = 39520 (7.972 sec)
INFO:tensorflow:lr = 0.0002688828 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.4456
INFO:tensorflow:loss = 1.2705394, step = 39620 (8.033 sec)
INFO:tensorflow:lr = 0.0002686127 (8.033 sec)
INFO:tensorflow:global_step/sec: 12.6205
INFO:tensorflow:loss = 1.271941, step = 39720 (7.926 sec)
INFO:tensorflow:lr = 0.00026834288 (7.925 sec)
INFO:tensorflow:global_step/sec: 12.7271
INFO:tensorflow:loss = 1.2671064, step = 39820 (7.855 sec)
INFO:tensorflow:lr = 0.00026807332 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.8522
INFO:tensorflow:loss = 1.2827927, step = 39920 (7.787 sec)
INFO:tensorflow:lr = 0.00026780402 (7.787 sec)
INFO:tensorflow:global_step/sec: 13.0029
INFO:tensorflow:loss = 1.2829088, step = 40020 (7.690 sec)
INFO:tensorflow:lr = 0.000267535 (7.690 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.24724
INFO:tensorflow:loss = 1.2646608, step = 40120 (12.122 sec)
INFO:tensorflow:lr = 0.00026726627 (12.124 sec)
INFO:tensorflow:global_step/sec: 12.9064
INFO:tensorflow:loss = 1.2660892, step = 40220 (7.746 sec)
INFO:tensorflow:lr = 0.00026699778 (7.744 sec)
INFO:tensorflow:global_step/sec: 12.6494
INFO:tensorflow:loss = 1.2711158, step = 40320 (7.913 sec)
INFO:tensorflow:lr = 0.00026672956 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.736
INFO:tensorflow:loss = 1.2661604, step = 40420 (7.846 sec)
INFO:tensorflow:lr = 0.00026646163 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.5546
INFO:tensorflow:loss = 1.2606105, step = 40520 (7.964 sec)
INFO:tensorflow:lr = 0.00026619397 (7.961 sec)
INFO:tensorflow:global_step/sec: 12.7677
INFO:tensorflow:loss = 1.27701, step = 40620 (7.831 sec)
INFO:tensorflow:lr = 0.00026592656 (7.831 sec)
INFO:tensorflow:global_step/sec: 12.938
INFO:tensorflow:loss = 1.2607424, step = 40720 (7.732 sec)
INFO:tensorflow:lr = 0.00026565944 (7.733 sec)
INFO:tensorflow:global_step/sec: 12.8514
INFO:tensorflow:loss = 1.270835, step = 40820 (7.782 sec)
INFO:tensorflow:lr = 0.0002653926 (7.781 sec)
INFO:tensorflow:global_step/sec: 12.6607
INFO:tensorflow:loss = 1.2720766, step = 40920 (7.900 sec)
INFO:tensorflow:lr = 0.00026512597 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.5758
INFO:tensorflow:loss = 1.2690309, step = 41020 (7.947 sec)
INFO:tensorflow:lr = 0.00026485967 (7.947 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.24971
INFO:tensorflow:loss = 1.2594911, step = 41120 (12.123 sec)
INFO:tensorflow:lr = 0.00026459363 (12.123 sec)
INFO:tensorflow:global_step/sec: 12.9862
INFO:tensorflow:loss = 1.283308, step = 41220 (7.699 sec)
INFO:tensorflow:lr = 0.00026432783 (7.700 sec)
INFO:tensorflow:global_step/sec: 12.7218
INFO:tensorflow:loss = 1.2755083, step = 41320 (7.865 sec)
INFO:tensorflow:lr = 0.00026406228 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.7322
INFO:tensorflow:loss = 1.268201, step = 41420 (7.849 sec)
INFO:tensorflow:lr = 0.000263797 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.4848
INFO:tensorflow:loss = 1.2764183, step = 41520 (8.015 sec)
INFO:tensorflow:lr = 0.00026353204 (8.013 sec)
INFO:tensorflow:global_step/sec: 12.5466
INFO:tensorflow:loss = 1.2742758, step = 41620 (7.972 sec)
INFO:tensorflow:lr = 0.0002632673 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.8135
INFO:tensorflow:loss = 1.2566481, step = 41720 (7.798 sec)
INFO:tensorflow:lr = 0.00026300285 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.9486
INFO:tensorflow:loss = 1.261928, step = 41820 (7.723 sec)
INFO:tensorflow:lr = 0.00026273864 (7.720 sec)
INFO:tensorflow:global_step/sec: 12.9607
INFO:tensorflow:loss = 1.2595774, step = 41920 (7.719 sec)
INFO:tensorflow:lr = 0.00026247473 (7.720 sec)
INFO:tensorflow:global_step/sec: 12.8198
INFO:tensorflow:loss = 1.2714173, step = 42020 (7.802 sec)
INFO:tensorflow:lr = 0.00026221108 (7.803 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.4317
INFO:tensorflow:loss = 1.2644148, step = 42120 (11.855 sec)
INFO:tensorflow:lr = 0.0002619477 (11.853 sec)
INFO:tensorflow:global_step/sec: 12.9926
INFO:tensorflow:loss = 1.2653011, step = 42220 (7.698 sec)
INFO:tensorflow:lr = 0.00026168456 (7.702 sec)
INFO:tensorflow:global_step/sec: 12.6806
INFO:tensorflow:loss = 1.2612933, step = 42320 (7.890 sec)
INFO:tensorflow:lr = 0.00026142164 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.8074
INFO:tensorflow:loss = 1.2797445, step = 42420 (7.805 sec)
INFO:tensorflow:lr = 0.00026115906 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.6395
INFO:tensorflow:loss = 1.2628508, step = 42520 (7.913 sec)
INFO:tensorflow:lr = 0.00026089672 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.8445
INFO:tensorflow:loss = 1.2819867, step = 42620 (7.788 sec)
INFO:tensorflow:lr = 0.00026063464 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.8711
INFO:tensorflow:loss = 1.2706252, step = 42720 (7.768 sec)
INFO:tensorflow:lr = 0.00026037282 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.3352
INFO:tensorflow:loss = 1.2649037, step = 42820 (8.102 sec)
INFO:tensorflow:lr = 0.00026011126 (8.101 sec)
INFO:tensorflow:global_step/sec: 12.8112
INFO:tensorflow:loss = 1.2671568, step = 42920 (7.809 sec)
INFO:tensorflow:lr = 0.00025985 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.9254
INFO:tensorflow:loss = 1.2667608, step = 43020 (7.741 sec)
INFO:tensorflow:lr = 0.00025958894 (7.741 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.3895
INFO:tensorflow:loss = 1.2655711, step = 43120 (11.913 sec)
INFO:tensorflow:lr = 0.0002593282 (11.913 sec)
INFO:tensorflow:global_step/sec: 12.4018
INFO:tensorflow:loss = 1.267358, step = 43220 (8.066 sec)
INFO:tensorflow:lr = 0.0002590677 (8.069 sec)
INFO:tensorflow:global_step/sec: 12.6024
INFO:tensorflow:loss = 1.2700015, step = 43320 (7.935 sec)
INFO:tensorflow:lr = 0.00025880744 (7.934 sec)
INFO:tensorflow:global_step/sec: 12.5451
INFO:tensorflow:loss = 1.2641869, step = 43420 (7.972 sec)
INFO:tensorflow:lr = 0.00025854746 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.8976
INFO:tensorflow:loss = 1.2638835, step = 43520 (7.755 sec)
INFO:tensorflow:lr = 0.00025828776 (7.753 sec)
INFO:tensorflow:global_step/sec: 12.6097
INFO:tensorflow:loss = 1.2561631, step = 43620 (7.927 sec)
INFO:tensorflow:lr = 0.0002580283 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.8381
INFO:tensorflow:loss = 1.2625241, step = 43720 (7.793 sec)
INFO:tensorflow:lr = 0.0002577691 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.825
INFO:tensorflow:loss = 1.2693264, step = 43820 (7.798 sec)
INFO:tensorflow:lr = 0.00025751017 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.7736
INFO:tensorflow:loss = 1.2730483, step = 43920 (7.822 sec)
INFO:tensorflow:lr = 0.0002572515 (7.823 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.75995
INFO:tensorflow:loss = 1.2587811, step = 44020 (11.418 sec)
INFO:tensorflow:lr = 0.00025699308 (11.420 sec)
INFO:tensorflow:global_step/sec: 12.8387
INFO:tensorflow:loss = 1.2614508, step = 44120 (7.790 sec)
INFO:tensorflow:lr = 0.0002567349 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.6823
INFO:tensorflow:loss = 1.2701207, step = 44220 (7.886 sec)
INFO:tensorflow:lr = 0.000256477 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.8214
INFO:tensorflow:loss = 1.2705317, step = 44320 (7.802 sec)
INFO:tensorflow:lr = 0.00025621938 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.4534
INFO:tensorflow:loss = 1.2627566, step = 44420 (8.030 sec)
INFO:tensorflow:lr = 0.00025596202 (8.030 sec)
INFO:tensorflow:global_step/sec: 12.6966
INFO:tensorflow:loss = 1.2665414, step = 44520 (7.870 sec)
INFO:tensorflow:lr = 0.0002557049 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.9501
INFO:tensorflow:loss = 1.2893751, step = 44620 (7.722 sec)
INFO:tensorflow:lr = 0.00025544802 (7.722 sec)
INFO:tensorflow:global_step/sec: 13.0372
INFO:tensorflow:loss = 1.2678509, step = 44720 (7.670 sec)
INFO:tensorflow:lr = 0.0002551914 (7.670 sec)
INFO:tensorflow:global_step/sec: 12.8701
INFO:tensorflow:loss = 1.2665724, step = 44820 (7.770 sec)
INFO:tensorflow:lr = 0.00025493503 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.7671
INFO:tensorflow:loss = 1.266214, step = 44920 (7.839 sec)
INFO:tensorflow:lr = 0.00025467898 (7.838 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.40537
INFO:tensorflow:loss = 1.2608075, step = 45020 (10.633 sec)
INFO:tensorflow:lr = 0.00025442315 (10.633 sec)
INFO:tensorflow:global_step/sec: 12.7037
INFO:tensorflow:loss = 1.264033, step = 45120 (7.869 sec)
INFO:tensorflow:lr = 0.00025416756 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.8665
INFO:tensorflow:loss = 1.2578142, step = 45220 (7.774 sec)
INFO:tensorflow:lr = 0.00025391224 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.4913
INFO:tensorflow:loss = 1.2547925, step = 45320 (8.004 sec)
INFO:tensorflow:lr = 0.0002536572 (8.004 sec)
INFO:tensorflow:global_step/sec: 12.595
INFO:tensorflow:loss = 1.2743986, step = 45420 (7.937 sec)
INFO:tensorflow:lr = 0.0002534024 (7.939 sec)
INFO:tensorflow:global_step/sec: 12.6593
INFO:tensorflow:loss = 1.266757, step = 45520 (7.897 sec)
INFO:tensorflow:lr = 0.00025314782 (7.899 sec)
INFO:tensorflow:global_step/sec: 12.8904
INFO:tensorflow:loss = 1.2690803, step = 45620 (7.760 sec)
INFO:tensorflow:lr = 0.00025289354 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.8386
INFO:tensorflow:loss = 1.2695453, step = 45720 (7.792 sec)
INFO:tensorflow:lr = 0.0002526395 (7.790 sec)
INFO:tensorflow:global_step/sec: 12.6332
INFO:tensorflow:loss = 1.2680589, step = 45820 (7.911 sec)
INFO:tensorflow:lr = 0.0002523857 (7.910 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.4824
INFO:tensorflow:loss = 1.2544335, step = 45920 (8.014 sec)
INFO:tensorflow:lr = 0.0002521322 (8.014 sec)
INFO:tensorflow:global_step/sec: 10.8606
INFO:tensorflow:loss = 1.261169, step = 46020 (9.218 sec)
INFO:tensorflow:lr = 0.00025187893 (9.220 sec)
INFO:tensorflow:global_step/sec: 12.6674
INFO:tensorflow:loss = 1.2620407, step = 46120 (7.885 sec)
INFO:tensorflow:lr = 0.0002516259 (7.884 sec)
INFO:tensorflow:global_step/sec: 12.6643
INFO:tensorflow:loss = 1.2677541, step = 46220 (7.893 sec)
INFO:tensorflow:lr = 0.00025137313 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.7899
INFO:tensorflow:loss = 1.254288, step = 46320 (7.818 sec)
INFO:tensorflow:lr = 0.00025112063 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.7355
INFO:tensorflow:loss = 1.2622324, step = 46420 (7.851 sec)
INFO:tensorflow:lr = 0.00025086835 (7.850 sec)
INFO:tensorflow:global_step/sec: 12.77
INFO:tensorflow:loss = 1.2603494, step = 46520 (7.838 sec)
INFO:tensorflow:lr = 0.00025061634 (7.838 sec)
INFO:tensorflow:global_step/sec: 12.8105
INFO:tensorflow:loss = 1.274346, step = 46620 (7.801 sec)
INFO:tensorflow:lr = 0.0002503646 (7.801 sec)
INFO:tensorflow:global_step/sec: 12.8057
INFO:tensorflow:loss = 1.2791383, step = 46720 (7.808 sec)
INFO:tensorflow:lr = 0.0002501131 (7.809 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.6813
INFO:tensorflow:loss = 1.2684876, step = 46820 (7.892 sec)
INFO:tensorflow:lr = 0.00024986186 (7.890 sec)
INFO:tensorflow:global_step/sec: 11.2116
INFO:tensorflow:loss = 1.261704, step = 46920 (8.916 sec)
INFO:tensorflow:lr = 0.00024961086 (8.916 sec)
INFO:tensorflow:global_step/sec: 12.5528
INFO:tensorflow:loss = 1.2601739, step = 47020 (7.968 sec)
INFO:tensorflow:lr = 0.00024936014 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.4465
INFO:tensorflow:loss = 1.2588917, step = 47120 (8.035 sec)
INFO:tensorflow:lr = 0.0002491096 (8.035 sec)
INFO:tensorflow:global_step/sec: 12.875
INFO:tensorflow:loss = 1.271802, step = 47220 (7.764 sec)
INFO:tensorflow:lr = 0.0002488594 (7.765 sec)
INFO:tensorflow:global_step/sec: 12.8335
INFO:tensorflow:loss = 1.263241, step = 47320 (7.789 sec)
INFO:tensorflow:lr = 0.00024860943 (7.788 sec)
INFO:tensorflow:global_step/sec: 13.0207
INFO:tensorflow:loss = 1.2612357, step = 47420 (7.685 sec)
INFO:tensorflow:lr = 0.0002483597 (7.685 sec)
INFO:tensorflow:global_step/sec: 12.6693
INFO:tensorflow:loss = 1.2592645, step = 47520 (7.888 sec)
INFO:tensorflow:lr = 0.0002481102 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.7021
INFO:tensorflow:loss = 1.2634231, step = 47620 (7.877 sec)
INFO:tensorflow:lr = 0.00024786094 (7.876 sec)
INFO:tensorflow:global_step/sec: 12.7586
INFO:tensorflow:loss = 1.2658721, step = 47720 (7.837 sec)
INFO:tensorflow:lr = 0.00024761196 (7.842 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.901
INFO:tensorflow:loss = 1.2613206, step = 47820 (8.403 sec)
INFO:tensorflow:lr = 0.00024736323 (8.400 sec)
INFO:tensorflow:global_step/sec: 11.2274
INFO:tensorflow:loss = 1.2668675, step = 47920 (8.908 sec)
INFO:tensorflow:lr = 0.00024711475 (8.907 sec)
INFO:tensorflow:global_step/sec: 12.6344
INFO:tensorflow:loss = 1.2707262, step = 48020 (7.912 sec)
INFO:tensorflow:lr = 0.00024686652 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.6208
INFO:tensorflow:loss = 1.264168, step = 48120 (7.926 sec)
INFO:tensorflow:lr = 0.00024661855 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.4144
INFO:tensorflow:loss = 1.2581247, step = 48220 (8.055 sec)
INFO:tensorflow:lr = 0.00024637082 (8.055 sec)
INFO:tensorflow:global_step/sec: 12.1425
INFO:tensorflow:loss = 1.2826554, step = 48320 (8.229 sec)
INFO:tensorflow:lr = 0.00024612332 (8.231 sec)
INFO:tensorflow:global_step/sec: 12.3167
INFO:tensorflow:loss = 1.2596526, step = 48420 (8.125 sec)
INFO:tensorflow:lr = 0.0002458761 (8.124 sec)
INFO:tensorflow:global_step/sec: 12.5863
INFO:tensorflow:loss = 1.2663782, step = 48520 (7.940 sec)
INFO:tensorflow:lr = 0.00024562908 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.4722
INFO:tensorflow:loss = 1.2596316, step = 48620 (8.022 sec)
INFO:tensorflow:lr = 0.00024538234 (8.019 sec)
INFO:tensorflow:global_step/sec: 12.3972
INFO:tensorflow:loss = 1.2628276, step = 48720 (8.062 sec)
INFO:tensorflow:lr = 0.00024513586 (8.062 sec)
INFO:tensorflow:global_step/sec: 12.812
INFO:tensorflow:loss = 1.267219, step = 48820 (7.805 sec)
INFO:tensorflow:lr = 0.0002448896 (7.805 sec)
INFO:tensorflow:Saving checkpoints for 48900 into ../model/lstm_transformer/model.ckpt.
WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/training/saver.py:963: remove_checkpoint (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.
Instructions for updating:
Use standard file APIs to delete files with this prefix.
INFO:tensorflow:Loss for final step: 1.2682308.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-48900
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-48900
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.706
INFO:tensorflow:Best (Exact Match) Accuracy: 0.707
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-48900
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 48900 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.263123, step = 48900
INFO:tensorflow:lr = 0.00024469278
INFO:tensorflow:global_step/sec: 9.80343
INFO:tensorflow:loss = 1.2753992, step = 49000 (10.205 sec)
INFO:tensorflow:lr = 0.000244447 (10.206 sec)
INFO:tensorflow:global_step/sec: 12.3248
INFO:tensorflow:loss = 1.2618505, step = 49100 (8.117 sec)
INFO:tensorflow:lr = 0.00024420145 (8.114 sec)
INFO:tensorflow:global_step/sec: 12.7277
INFO:tensorflow:loss = 1.2551093, step = 49200 (7.851 sec)
INFO:tensorflow:lr = 0.00024395615 (7.852 sec)
INFO:tensorflow:global_step/sec: 13.0713
INFO:tensorflow:loss = 1.2688679, step = 49300 (7.651 sec)
INFO:tensorflow:lr = 0.00024371107 (7.650 sec)
INFO:tensorflow:global_step/sec: 12.8647
INFO:tensorflow:loss = 1.2720437, step = 49400 (7.774 sec)
INFO:tensorflow:lr = 0.00024346625 (7.775 sec)
INFO:tensorflow:global_step/sec: 12.7116
INFO:tensorflow:loss = 1.2706873, step = 49500 (7.866 sec)
INFO:tensorflow:lr = 0.00024322169 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.5179
INFO:tensorflow:loss = 1.2638872, step = 49600 (7.992 sec)
INFO:tensorflow:lr = 0.00024297737 (7.991 sec)
INFO:tensorflow:global_step/sec: 12.5553
INFO:tensorflow:loss = 1.2629794, step = 49700 (7.961 sec)
INFO:tensorflow:lr = 0.00024273328 (7.961 sec)
INFO:tensorflow:global_step/sec: 12.9475
INFO:tensorflow:loss = 1.2555556, step = 49800 (7.729 sec)
INFO:tensorflow:lr = 0.00024248945 (7.728 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.31103
INFO:tensorflow:loss = 1.2618929, step = 49900 (12.026 sec)
INFO:tensorflow:lr = 0.00024224588 (12.026 sec)
INFO:tensorflow:global_step/sec: 12.9152
INFO:tensorflow:loss = 1.2585716, step = 50000 (7.749 sec)
INFO:tensorflow:lr = 0.00024200253 (7.749 sec)
INFO:tensorflow:global_step/sec: 12.8223
INFO:tensorflow:loss = 1.2602012, step = 50100 (7.793 sec)
INFO:tensorflow:lr = 0.00024175941 (7.794 sec)
INFO:tensorflow:global_step/sec: 13.0814
INFO:tensorflow:loss = 1.2600421, step = 50200 (7.650 sec)
INFO:tensorflow:lr = 0.00024151658 (7.649 sec)
INFO:tensorflow:global_step/sec: 12.9555
INFO:tensorflow:loss = 1.2640244, step = 50300 (7.713 sec)
INFO:tensorflow:lr = 0.00024127394 (7.713 sec)
INFO:tensorflow:global_step/sec: 12.7933
INFO:tensorflow:loss = 1.2591022, step = 50400 (7.820 sec)
INFO:tensorflow:lr = 0.0002410316 (7.825 sec)
INFO:tensorflow:global_step/sec: 12.3763
INFO:tensorflow:loss = 1.2563342, step = 50500 (8.080 sec)
INFO:tensorflow:lr = 0.00024078948 (8.076 sec)
INFO:tensorflow:global_step/sec: 12.6579
INFO:tensorflow:loss = 1.251954, step = 50600 (7.897 sec)
INFO:tensorflow:lr = 0.0002405476 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.8405
INFO:tensorflow:loss = 1.2703358, step = 50700 (7.795 sec)
INFO:tensorflow:lr = 0.00024030596 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.7567
INFO:tensorflow:loss = 1.260641, step = 50800 (7.839 sec)
INFO:tensorflow:lr = 0.00024006456 (7.839 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.37615
INFO:tensorflow:loss = 1.2584833, step = 50900 (11.932 sec)
INFO:tensorflow:lr = 0.00023982344 (11.932 sec)
INFO:tensorflow:global_step/sec: 12.8102
INFO:tensorflow:loss = 1.2630175, step = 51000 (7.805 sec)
INFO:tensorflow:lr = 0.00023958248 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.8743
INFO:tensorflow:loss = 1.2574093, step = 51100 (7.768 sec)
INFO:tensorflow:lr = 0.00023934185 (7.768 sec)
INFO:tensorflow:global_step/sec: 12.9835
INFO:tensorflow:loss = 1.2609439, step = 51200 (7.705 sec)
INFO:tensorflow:lr = 0.0002391014 (7.705 sec)
INFO:tensorflow:global_step/sec: 12.8867
INFO:tensorflow:loss = 1.2654866, step = 51300 (7.757 sec)
INFO:tensorflow:lr = 0.00023886122 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.7474
INFO:tensorflow:loss = 1.2698414, step = 51400 (7.844 sec)
INFO:tensorflow:lr = 0.00023862127 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.7932
INFO:tensorflow:loss = 1.2593272, step = 51500 (7.817 sec)
INFO:tensorflow:lr = 0.00023838157 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.6452
INFO:tensorflow:loss = 1.253849, step = 51600 (7.914 sec)
INFO:tensorflow:lr = 0.00023814212 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.6491
INFO:tensorflow:loss = 1.2664359, step = 51700 (7.906 sec)
INFO:tensorflow:lr = 0.00023790292 (7.905 sec)
INFO:tensorflow:global_step/sec: 12.6054
INFO:tensorflow:loss = 1.2593892, step = 51800 (7.927 sec)
INFO:tensorflow:lr = 0.0002376639 (7.928 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.3781
INFO:tensorflow:loss = 1.2685262, step = 51900 (11.940 sec)
INFO:tensorflow:lr = 0.0002374252 (11.941 sec)
INFO:tensorflow:global_step/sec: 12.5037
INFO:tensorflow:loss = 1.263798, step = 52000 (7.997 sec)
INFO:tensorflow:lr = 0.00023718669 (7.997 sec)
INFO:tensorflow:global_step/sec: 12.886
INFO:tensorflow:loss = 1.2689533, step = 52100 (7.756 sec)
INFO:tensorflow:lr = 0.00023694841 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.7961
INFO:tensorflow:loss = 1.27047, step = 52200 (7.823 sec)
INFO:tensorflow:lr = 0.0002367104 (7.823 sec)
INFO:tensorflow:global_step/sec: 13.0623
INFO:tensorflow:loss = 1.2621255, step = 52300 (7.648 sec)
INFO:tensorflow:lr = 0.00023647262 (7.650 sec)
INFO:tensorflow:global_step/sec: 12.8008
INFO:tensorflow:loss = 1.270298, step = 52400 (7.812 sec)
INFO:tensorflow:lr = 0.00023623506 (7.811 sec)
INFO:tensorflow:global_step/sec: 12.8887
INFO:tensorflow:loss = 1.2604018, step = 52500 (7.760 sec)
INFO:tensorflow:lr = 0.00023599774 (7.761 sec)
INFO:tensorflow:global_step/sec: 12.717
INFO:tensorflow:loss = 1.2635633, step = 52600 (7.862 sec)
INFO:tensorflow:lr = 0.0002357607 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.6579
INFO:tensorflow:loss = 1.2612284, step = 52700 (7.900 sec)
INFO:tensorflow:lr = 0.00023552388 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.7953
INFO:tensorflow:loss = 1.258312, step = 52800 (7.821 sec)
INFO:tensorflow:lr = 0.0002352873 (7.820 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.38183
INFO:tensorflow:loss = 1.2634532, step = 52900 (11.925 sec)
INFO:tensorflow:lr = 0.00023505092 (11.929 sec)
INFO:tensorflow:global_step/sec: 12.5748
INFO:tensorflow:loss = 1.2694097, step = 53000 (7.953 sec)
INFO:tensorflow:lr = 0.00023481481 (7.949 sec)
INFO:tensorflow:global_step/sec: 12.8424
INFO:tensorflow:loss = 1.2625628, step = 53100 (7.792 sec)
INFO:tensorflow:lr = 0.00023457894 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.5576
INFO:tensorflow:loss = 1.260535, step = 53200 (7.964 sec)
INFO:tensorflow:lr = 0.00023434329 (7.965 sec)
INFO:tensorflow:global_step/sec: 12.7491
INFO:tensorflow:loss = 1.2549899, step = 53300 (7.843 sec)
INFO:tensorflow:lr = 0.0002341079 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.7266
INFO:tensorflow:loss = 1.2714366, step = 53400 (7.852 sec)
INFO:tensorflow:lr = 0.00023387272 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.7257
INFO:tensorflow:loss = 1.2598583, step = 53500 (7.863 sec)
INFO:tensorflow:lr = 0.00023363781 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.9742
INFO:tensorflow:loss = 1.2618462, step = 53600 (7.710 sec)
INFO:tensorflow:lr = 0.0002334031 (7.707 sec)
INFO:tensorflow:global_step/sec: 12.7653
INFO:tensorflow:loss = 1.2702688, step = 53700 (7.828 sec)
INFO:tensorflow:lr = 0.00023316864 (7.828 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.79073
INFO:tensorflow:loss = 1.2538612, step = 53800 (11.378 sec)
INFO:tensorflow:lr = 0.00023293443 (11.380 sec)
INFO:tensorflow:global_step/sec: 13.0106
INFO:tensorflow:loss = 1.2529118, step = 53900 (7.687 sec)
INFO:tensorflow:lr = 0.00023270043 (7.685 sec)
INFO:tensorflow:global_step/sec: 12.9886
INFO:tensorflow:loss = 1.2524719, step = 54000 (7.694 sec)
INFO:tensorflow:lr = 0.00023246667 (7.695 sec)
INFO:tensorflow:global_step/sec: 12.6384
INFO:tensorflow:loss = 1.2778753, step = 54100 (7.917 sec)
INFO:tensorflow:lr = 0.00023223316 (7.917 sec)
INFO:tensorflow:global_step/sec: 12.5824
INFO:tensorflow:loss = 1.2629167, step = 54200 (7.943 sec)
INFO:tensorflow:lr = 0.00023199987 (7.946 sec)
INFO:tensorflow:global_step/sec: 12.8335
INFO:tensorflow:loss = 1.2570986, step = 54300 (7.792 sec)
INFO:tensorflow:lr = 0.00023176681 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.6558
INFO:tensorflow:loss = 1.2723862, step = 54400 (7.902 sec)
INFO:tensorflow:lr = 0.00023153402 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.8133
INFO:tensorflow:loss = 1.256413, step = 54500 (7.804 sec)
INFO:tensorflow:lr = 0.00023130143 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.7269
INFO:tensorflow:loss = 1.2575724, step = 54600 (7.857 sec)
INFO:tensorflow:lr = 0.00023106908 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.5403
INFO:tensorflow:loss = 1.272584, step = 54700 (7.975 sec)
INFO:tensorflow:lr = 0.00023083696 (7.976 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.19518
INFO:tensorflow:loss = 1.2527137, step = 54800 (10.875 sec)
INFO:tensorflow:lr = 0.0002306051 (10.876 sec)
INFO:tensorflow:global_step/sec: 12.491
INFO:tensorflow:loss = 1.2544173, step = 54900 (8.012 sec)
INFO:tensorflow:lr = 0.00023037342 (8.009 sec)
INFO:tensorflow:global_step/sec: 13.0044
INFO:tensorflow:loss = 1.2695364, step = 55000 (7.683 sec)
INFO:tensorflow:lr = 0.00023014202 (7.691 sec)
INFO:tensorflow:global_step/sec: 12.6771
INFO:tensorflow:loss = 1.2688967, step = 55100 (7.888 sec)
INFO:tensorflow:lr = 0.00022991082 (7.880 sec)
INFO:tensorflow:global_step/sec: 12.7627
INFO:tensorflow:loss = 1.2663212, step = 55200 (7.835 sec)
INFO:tensorflow:lr = 0.00022967989 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.6703
INFO:tensorflow:loss = 1.2508467, step = 55300 (7.897 sec)
INFO:tensorflow:lr = 0.00022944914 (7.894 sec)
INFO:tensorflow:global_step/sec: 12.7355
INFO:tensorflow:loss = 1.2672036, step = 55400 (7.849 sec)
INFO:tensorflow:lr = 0.00022921867 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.8933
INFO:tensorflow:loss = 1.2606906, step = 55500 (7.755 sec)
INFO:tensorflow:lr = 0.0002289884 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.7887
INFO:tensorflow:loss = 1.2555453, step = 55600 (7.826 sec)
INFO:tensorflow:lr = 0.0002287584 (7.825 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.3639
INFO:tensorflow:loss = 1.2551997, step = 55700 (8.091 sec)
INFO:tensorflow:lr = 0.00022852859 (8.089 sec)
INFO:tensorflow:global_step/sec: 10.6991
INFO:tensorflow:loss = 1.2652216, step = 55800 (9.337 sec)
INFO:tensorflow:lr = 0.00022829902 (9.342 sec)
INFO:tensorflow:global_step/sec: 12.824
INFO:tensorflow:loss = 1.2569361, step = 55900 (7.800 sec)
INFO:tensorflow:lr = 0.00022806968 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.794
INFO:tensorflow:loss = 1.2683395, step = 56000 (7.815 sec)
INFO:tensorflow:lr = 0.00022784059 (7.812 sec)
INFO:tensorflow:global_step/sec: 12.9955
INFO:tensorflow:loss = 1.264496, step = 56100 (7.695 sec)
INFO:tensorflow:lr = 0.00022761173 (7.695 sec)
INFO:tensorflow:global_step/sec: 13.0333
INFO:tensorflow:loss = 1.2644389, step = 56200 (7.672 sec)
INFO:tensorflow:lr = 0.00022738309 (7.676 sec)
INFO:tensorflow:global_step/sec: 13.022
INFO:tensorflow:loss = 1.253439, step = 56300 (7.679 sec)
INFO:tensorflow:lr = 0.00022715465 (7.676 sec)
INFO:tensorflow:global_step/sec: 12.5266
INFO:tensorflow:loss = 1.2558391, step = 56400 (7.983 sec)
INFO:tensorflow:lr = 0.00022692647 (7.984 sec)
INFO:tensorflow:global_step/sec: 12.7366
INFO:tensorflow:loss = 1.2584279, step = 56500 (7.855 sec)
INFO:tensorflow:lr = 0.00022669851 (7.854 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2942
INFO:tensorflow:loss = 1.2605096, step = 56600 (8.132 sec)
INFO:tensorflow:lr = 0.00022647077 (8.133 sec)
INFO:tensorflow:global_step/sec: 10.8588
INFO:tensorflow:loss = 1.2645557, step = 56700 (9.207 sec)
INFO:tensorflow:lr = 0.0002262433 (9.205 sec)
INFO:tensorflow:global_step/sec: 12.9058
INFO:tensorflow:loss = 1.257235, step = 56800 (7.751 sec)
INFO:tensorflow:lr = 0.00022601604 (7.751 sec)
INFO:tensorflow:global_step/sec: 12.6226
INFO:tensorflow:loss = 1.259087, step = 56900 (7.924 sec)
INFO:tensorflow:lr = 0.00022578899 (7.925 sec)
INFO:tensorflow:global_step/sec: 12.6459
INFO:tensorflow:loss = 1.2512816, step = 57000 (7.905 sec)
INFO:tensorflow:lr = 0.00022556218 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.8169
INFO:tensorflow:loss = 1.256032, step = 57100 (7.800 sec)
INFO:tensorflow:lr = 0.00022533562 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.7711
INFO:tensorflow:loss = 1.2535781, step = 57200 (7.830 sec)
INFO:tensorflow:lr = 0.00022510927 (7.829 sec)
INFO:tensorflow:global_step/sec: 12.7293
INFO:tensorflow:loss = 1.257878, step = 57300 (7.863 sec)
INFO:tensorflow:lr = 0.0002248831 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.5132
INFO:tensorflow:loss = 1.2791443, step = 57400 (7.988 sec)
INFO:tensorflow:lr = 0.00022465723 (7.987 sec)
INFO:tensorflow:global_step/sec: 13.0392
INFO:tensorflow:loss = 1.2567543, step = 57500 (7.668 sec)
INFO:tensorflow:lr = 0.00022443154 (7.669 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1479
INFO:tensorflow:loss = 1.2558892, step = 57600 (8.235 sec)
INFO:tensorflow:lr = 0.0002242061 (8.235 sec)
INFO:tensorflow:global_step/sec: 11.7853
INFO:tensorflow:loss = 1.270159, step = 57700 (8.479 sec)
INFO:tensorflow:lr = 0.00022398087 (8.480 sec)
INFO:tensorflow:global_step/sec: 12.9312
INFO:tensorflow:loss = 1.2561911, step = 57800 (7.738 sec)
INFO:tensorflow:lr = 0.00022375588 (7.737 sec)
INFO:tensorflow:global_step/sec: 12.8943
INFO:tensorflow:loss = 1.2581128, step = 57900 (7.751 sec)
INFO:tensorflow:lr = 0.0002235311 (7.751 sec)
INFO:tensorflow:global_step/sec: 12.89
INFO:tensorflow:loss = 1.2589202, step = 58000 (7.763 sec)
INFO:tensorflow:lr = 0.00022330656 (7.763 sec)
INFO:tensorflow:global_step/sec: 13.0328
INFO:tensorflow:loss = 1.2635732, step = 58100 (7.668 sec)
INFO:tensorflow:lr = 0.00022308226 (7.670 sec)
INFO:tensorflow:global_step/sec: 12.9888
INFO:tensorflow:loss = 1.2706214, step = 58200 (7.699 sec)
INFO:tensorflow:lr = 0.00022285814 (7.699 sec)
INFO:tensorflow:global_step/sec: 12.7051
INFO:tensorflow:loss = 1.258386, step = 58300 (7.871 sec)
INFO:tensorflow:lr = 0.00022263429 (7.879 sec)
INFO:tensorflow:global_step/sec: 13.0078
INFO:tensorflow:loss = 1.2566429, step = 58400 (7.687 sec)
INFO:tensorflow:lr = 0.00022241064 (7.676 sec)
INFO:tensorflow:global_step/sec: 12.6443
INFO:tensorflow:loss = 1.2667817, step = 58500 (7.910 sec)
INFO:tensorflow:lr = 0.00022218723 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.7619
INFO:tensorflow:loss = 1.2693475, step = 58600 (7.835 sec)
INFO:tensorflow:lr = 0.00022196402 (7.835 sec)
INFO:tensorflow:Saving checkpoints for 58680 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2575451.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-58680
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-58680
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.714
INFO:tensorflow:Best (Exact Match) Accuracy: 0.714
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-58680
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 58680 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2724138, step = 58680
INFO:tensorflow:lr = 0.00022178564
INFO:tensorflow:global_step/sec: 10.3144
INFO:tensorflow:loss = 1.2573106, step = 58780 (9.698 sec)
INFO:tensorflow:lr = 0.00022156286 (9.706 sec)
INFO:tensorflow:global_step/sec: 12.8129
INFO:tensorflow:loss = 1.2532308, step = 58880 (7.803 sec)
INFO:tensorflow:lr = 0.00022134029 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.6229
INFO:tensorflow:loss = 1.2531558, step = 58980 (7.928 sec)
INFO:tensorflow:lr = 0.00022111794 (7.928 sec)
INFO:tensorflow:global_step/sec: 12.8638
INFO:tensorflow:loss = 1.2645673, step = 59080 (7.773 sec)
INFO:tensorflow:lr = 0.0002208958 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.4406
INFO:tensorflow:loss = 1.2638228, step = 59180 (8.039 sec)
INFO:tensorflow:lr = 0.00022067393 (8.038 sec)
INFO:tensorflow:global_step/sec: 12.6973
INFO:tensorflow:loss = 1.2559628, step = 59280 (7.877 sec)
INFO:tensorflow:lr = 0.00022045226 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.6856
INFO:tensorflow:loss = 1.256625, step = 59380 (7.876 sec)
INFO:tensorflow:lr = 0.00022023081 (7.877 sec)
INFO:tensorflow:global_step/sec: 13.3057
INFO:tensorflow:loss = 1.2582057, step = 59480 (7.517 sec)
INFO:tensorflow:lr = 0.00022000956 (7.517 sec)
INFO:tensorflow:global_step/sec: 12.5282
INFO:tensorflow:loss = 1.2669188, step = 59580 (7.982 sec)
INFO:tensorflow:lr = 0.00021978856 (7.986 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.22968
INFO:tensorflow:loss = 1.2529101, step = 59680 (12.156 sec)
INFO:tensorflow:lr = 0.00021956777 (12.151 sec)
INFO:tensorflow:global_step/sec: 12.8956
INFO:tensorflow:loss = 1.2675282, step = 59780 (7.755 sec)
INFO:tensorflow:lr = 0.00021934723 (7.760 sec)
INFO:tensorflow:global_step/sec: 12.6672
INFO:tensorflow:loss = 1.2623235, step = 59880 (7.891 sec)
INFO:tensorflow:lr = 0.00021912686 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.5604
INFO:tensorflow:loss = 1.2686803, step = 59980 (7.958 sec)
INFO:tensorflow:lr = 0.00021890676 (7.956 sec)
INFO:tensorflow:global_step/sec: 12.9026
INFO:tensorflow:loss = 1.2615492, step = 60080 (7.751 sec)
INFO:tensorflow:lr = 0.00021868687 (7.753 sec)
INFO:tensorflow:global_step/sec: 12.8044
INFO:tensorflow:loss = 1.2547079, step = 60180 (7.809 sec)
INFO:tensorflow:lr = 0.00021846718 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.8346
INFO:tensorflow:loss = 1.2528274, step = 60280 (7.792 sec)
INFO:tensorflow:lr = 0.00021824775 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.9208
INFO:tensorflow:loss = 1.2669843, step = 60380 (7.741 sec)
INFO:tensorflow:lr = 0.0002180285 (7.738 sec)
INFO:tensorflow:global_step/sec: 12.735
INFO:tensorflow:loss = 1.2558151, step = 60480 (7.850 sec)
INFO:tensorflow:lr = 0.00021780949 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.8776
INFO:tensorflow:loss = 1.2551497, step = 60580 (7.771 sec)
INFO:tensorflow:lr = 0.00021759068 (7.771 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.34405
INFO:tensorflow:loss = 1.2546343, step = 60680 (11.980 sec)
INFO:tensorflow:lr = 0.0002173721 (11.980 sec)
INFO:tensorflow:global_step/sec: 12.7156
INFO:tensorflow:loss = 1.2520571, step = 60780 (7.867 sec)
INFO:tensorflow:lr = 0.00021715376 (7.867 sec)
INFO:tensorflow:global_step/sec: 12.6516
INFO:tensorflow:loss = 1.2656932, step = 60880 (7.904 sec)
INFO:tensorflow:lr = 0.00021693563 (7.905 sec)
INFO:tensorflow:global_step/sec: 13.0749
INFO:tensorflow:loss = 1.2510619, step = 60980 (7.650 sec)
INFO:tensorflow:lr = 0.00021671772 (7.650 sec)
INFO:tensorflow:global_step/sec: 12.6946
INFO:tensorflow:loss = 1.2555563, step = 61080 (7.872 sec)
INFO:tensorflow:lr = 0.00021650002 (7.872 sec)
INFO:tensorflow:global_step/sec: 12.8617
INFO:tensorflow:loss = 1.2622253, step = 61180 (7.778 sec)
INFO:tensorflow:lr = 0.00021628253 (7.778 sec)
INFO:tensorflow:global_step/sec: 12.7325
INFO:tensorflow:loss = 1.2601289, step = 61280 (7.855 sec)
INFO:tensorflow:lr = 0.00021606525 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.7575
INFO:tensorflow:loss = 1.2692169, step = 61380 (7.834 sec)
INFO:tensorflow:lr = 0.00021584822 (7.833 sec)
INFO:tensorflow:global_step/sec: 12.6755
INFO:tensorflow:loss = 1.2582502, step = 61480 (7.889 sec)
INFO:tensorflow:lr = 0.00021563139 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.9292
INFO:tensorflow:loss = 1.2521135, step = 61580 (7.739 sec)
INFO:tensorflow:lr = 0.00021541478 (7.739 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.3132
INFO:tensorflow:loss = 1.2625241, step = 61680 (12.031 sec)
INFO:tensorflow:lr = 0.0002151984 (12.030 sec)
INFO:tensorflow:global_step/sec: 12.8491
INFO:tensorflow:loss = 1.2569088, step = 61780 (7.777 sec)
INFO:tensorflow:lr = 0.00021498224 (7.778 sec)
INFO:tensorflow:global_step/sec: 12.6945
INFO:tensorflow:loss = 1.2559131, step = 61880 (7.882 sec)
INFO:tensorflow:lr = 0.00021476626 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.8822
INFO:tensorflow:loss = 1.2696959, step = 61980 (7.759 sec)
INFO:tensorflow:lr = 0.00021455051 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.8127
INFO:tensorflow:loss = 1.2561213, step = 62080 (7.803 sec)
INFO:tensorflow:lr = 0.00021433501 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.8856
INFO:tensorflow:loss = 1.2621582, step = 62180 (7.766 sec)
INFO:tensorflow:lr = 0.00021411969 (7.766 sec)
INFO:tensorflow:global_step/sec: 12.5122
INFO:tensorflow:loss = 1.2536796, step = 62280 (7.991 sec)
INFO:tensorflow:lr = 0.00021390461 (7.990 sec)
INFO:tensorflow:global_step/sec: 12.3773
INFO:tensorflow:loss = 1.2566583, step = 62380 (8.081 sec)
INFO:tensorflow:lr = 0.00021368972 (8.081 sec)
INFO:tensorflow:global_step/sec: 12.6472
INFO:tensorflow:loss = 1.2600583, step = 62480 (7.900 sec)
INFO:tensorflow:lr = 0.00021347508 (7.904 sec)
INFO:tensorflow:global_step/sec: 12.6644
INFO:tensorflow:loss = 1.2559776, step = 62580 (7.902 sec)
INFO:tensorflow:lr = 0.00021326065 (7.898 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.48244
INFO:tensorflow:loss = 1.2560581, step = 62680 (11.790 sec)
INFO:tensorflow:lr = 0.0002130464 (11.791 sec)
INFO:tensorflow:global_step/sec: 12.8693
INFO:tensorflow:loss = 1.2563652, step = 62780 (7.768 sec)
INFO:tensorflow:lr = 0.0002128324 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.7061
INFO:tensorflow:loss = 1.2647818, step = 62880 (7.869 sec)
INFO:tensorflow:lr = 0.0002126186 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.5926
INFO:tensorflow:loss = 1.2658582, step = 62980 (7.939 sec)
INFO:tensorflow:lr = 0.00021240504 (7.938 sec)
INFO:tensorflow:global_step/sec: 12.8705
INFO:tensorflow:loss = 1.2523164, step = 63080 (7.769 sec)
INFO:tensorflow:lr = 0.00021219168 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.7683
INFO:tensorflow:loss = 1.2602874, step = 63180 (7.837 sec)
INFO:tensorflow:lr = 0.0002119785 (7.842 sec)
INFO:tensorflow:global_step/sec: 13.0614
INFO:tensorflow:loss = 1.2652452, step = 63280 (7.655 sec)
INFO:tensorflow:lr = 0.00021176557 (7.650 sec)
INFO:tensorflow:global_step/sec: 12.6689
INFO:tensorflow:loss = 1.250535, step = 63380 (7.889 sec)
INFO:tensorflow:lr = 0.00021155283 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.726
INFO:tensorflow:loss = 1.2587569, step = 63480 (7.859 sec)
INFO:tensorflow:lr = 0.00021134033 (7.869 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.5915
INFO:tensorflow:loss = 1.2486932, step = 63580 (11.639 sec)
INFO:tensorflow:lr = 0.00021112803 (11.630 sec)
INFO:tensorflow:global_step/sec: 12.746
INFO:tensorflow:loss = 1.2581683, step = 63680 (7.845 sec)
INFO:tensorflow:lr = 0.00021091594 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.9087
INFO:tensorflow:loss = 1.2698822, step = 63780 (7.752 sec)
INFO:tensorflow:lr = 0.00021070408 (7.744 sec)
INFO:tensorflow:global_step/sec: 12.7608
INFO:tensorflow:loss = 1.2671998, step = 63880 (7.835 sec)
INFO:tensorflow:lr = 0.00021049242 (7.835 sec)
INFO:tensorflow:global_step/sec: 12.9193
INFO:tensorflow:loss = 1.2540299, step = 63980 (7.742 sec)
INFO:tensorflow:lr = 0.00021028098 (7.742 sec)
INFO:tensorflow:global_step/sec: 12.7305
INFO:tensorflow:loss = 1.2617122, step = 64080 (7.856 sec)
INFO:tensorflow:lr = 0.00021006975 (7.856 sec)
INFO:tensorflow:global_step/sec: 12.5839
INFO:tensorflow:loss = 1.2595084, step = 64180 (7.945 sec)
INFO:tensorflow:lr = 0.00020985873 (7.946 sec)
INFO:tensorflow:global_step/sec: 13.0107
INFO:tensorflow:loss = 1.2606783, step = 64280 (7.681 sec)
INFO:tensorflow:lr = 0.00020964789 (7.681 sec)
INFO:tensorflow:global_step/sec: 12.6722
INFO:tensorflow:loss = 1.2504494, step = 64380 (7.898 sec)
INFO:tensorflow:lr = 0.00020943732 (7.898 sec)
INFO:tensorflow:global_step/sec: 12.6237
INFO:tensorflow:loss = 1.2601182, step = 64480 (7.921 sec)
INFO:tensorflow:lr = 0.00020922691 (7.921 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.1461
INFO:tensorflow:loss = 1.2577064, step = 64580 (10.934 sec)
INFO:tensorflow:lr = 0.00020901677 (10.934 sec)
INFO:tensorflow:global_step/sec: 12.7236
INFO:tensorflow:loss = 1.2530557, step = 64680 (7.857 sec)
INFO:tensorflow:lr = 0.0002088068 (7.858 sec)
INFO:tensorflow:global_step/sec: 13.0769
INFO:tensorflow:loss = 1.2567884, step = 64780 (7.651 sec)
INFO:tensorflow:lr = 0.00020859703 (7.655 sec)
INFO:tensorflow:global_step/sec: 12.684
INFO:tensorflow:loss = 1.251407, step = 64880 (7.882 sec)
INFO:tensorflow:lr = 0.00020838752 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.8542
INFO:tensorflow:loss = 1.2556778, step = 64980 (7.781 sec)
INFO:tensorflow:lr = 0.00020817819 (7.781 sec)
INFO:tensorflow:global_step/sec: 12.7122
INFO:tensorflow:loss = 1.2546712, step = 65080 (7.860 sec)
INFO:tensorflow:lr = 0.00020796905 (7.860 sec)
INFO:tensorflow:global_step/sec: 12.9692
INFO:tensorflow:loss = 1.2524756, step = 65180 (7.715 sec)
INFO:tensorflow:lr = 0.00020776014 (7.715 sec)
INFO:tensorflow:global_step/sec: 13.0259
INFO:tensorflow:loss = 1.2570271, step = 65280 (7.677 sec)
INFO:tensorflow:lr = 0.00020755142 (7.680 sec)
INFO:tensorflow:global_step/sec: 12.7252
INFO:tensorflow:loss = 1.25036, step = 65380 (7.860 sec)
INFO:tensorflow:lr = 0.00020734294 (7.859 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1057
INFO:tensorflow:loss = 1.2546037, step = 65480 (8.258 sec)
INFO:tensorflow:lr = 0.00020713465 (8.258 sec)
INFO:tensorflow:global_step/sec: 10.5931
INFO:tensorflow:loss = 1.2538458, step = 65580 (9.437 sec)
INFO:tensorflow:lr = 0.00020692658 (9.435 sec)
INFO:tensorflow:global_step/sec: 12.8133
INFO:tensorflow:loss = 1.2516928, step = 65680 (7.804 sec)
INFO:tensorflow:lr = 0.00020671873 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.9175
INFO:tensorflow:loss = 1.2501926, step = 65780 (7.746 sec)
INFO:tensorflow:lr = 0.00020651106 (7.751 sec)
INFO:tensorflow:global_step/sec: 13.1593
INFO:tensorflow:loss = 1.2550164, step = 65880 (7.601 sec)
INFO:tensorflow:lr = 0.00020630364 (7.596 sec)
INFO:tensorflow:global_step/sec: 12.7002
INFO:tensorflow:loss = 1.2505937, step = 65980 (7.874 sec)
INFO:tensorflow:lr = 0.00020609639 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.373
INFO:tensorflow:loss = 1.2635084, step = 66080 (8.078 sec)
INFO:tensorflow:lr = 0.00020588936 (8.079 sec)
INFO:tensorflow:global_step/sec: 12.8026
INFO:tensorflow:loss = 1.2599782, step = 66180 (7.815 sec)
INFO:tensorflow:lr = 0.00020568253 (7.814 sec)
INFO:tensorflow:global_step/sec: 12.5392
INFO:tensorflow:loss = 1.2670157, step = 66280 (7.970 sec)
INFO:tensorflow:lr = 0.00020547592 (7.970 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2205
INFO:tensorflow:loss = 1.2632979, step = 66380 (8.189 sec)
INFO:tensorflow:lr = 0.0002052695 (8.188 sec)
INFO:tensorflow:global_step/sec: 11.0385
INFO:tensorflow:loss = 1.269494, step = 66480 (9.056 sec)
INFO:tensorflow:lr = 0.00020506332 (9.058 sec)
INFO:tensorflow:global_step/sec: 12.8458
INFO:tensorflow:loss = 1.2560563, step = 66580 (7.781 sec)
INFO:tensorflow:lr = 0.00020485735 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.5578
INFO:tensorflow:loss = 1.2637135, step = 66680 (7.969 sec)
INFO:tensorflow:lr = 0.00020465154 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.8306
INFO:tensorflow:loss = 1.2596672, step = 66780 (7.794 sec)
INFO:tensorflow:lr = 0.00020444595 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.9435
INFO:tensorflow:loss = 1.253951, step = 66880 (7.723 sec)
INFO:tensorflow:lr = 0.00020424058 (7.723 sec)
INFO:tensorflow:global_step/sec: 12.5873
INFO:tensorflow:loss = 1.2510319, step = 66980 (7.948 sec)
INFO:tensorflow:lr = 0.00020403544 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.9418
INFO:tensorflow:loss = 1.2582647, step = 67080 (7.728 sec)
INFO:tensorflow:lr = 0.00020383045 (7.728 sec)
INFO:tensorflow:global_step/sec: 12.9173
INFO:tensorflow:loss = 1.2596313, step = 67180 (7.739 sec)
INFO:tensorflow:lr = 0.00020362572 (7.739 sec)
INFO:tensorflow:global_step/sec: 12.9503
INFO:tensorflow:loss = 1.2502924, step = 67280 (7.722 sec)
INFO:tensorflow:lr = 0.00020342116 (7.722 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1161
INFO:tensorflow:loss = 1.2566557, step = 67380 (8.256 sec)
INFO:tensorflow:lr = 0.00020321681 (8.255 sec)
INFO:tensorflow:global_step/sec: 11.3069
INFO:tensorflow:loss = 1.2655523, step = 67480 (8.838 sec)
INFO:tensorflow:lr = 0.00020301268 (8.838 sec)
INFO:tensorflow:global_step/sec: 12.8634
INFO:tensorflow:loss = 1.2517667, step = 67580 (7.774 sec)
INFO:tensorflow:lr = 0.00020280876 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.9586
INFO:tensorflow:loss = 1.2534577, step = 67680 (7.717 sec)
INFO:tensorflow:lr = 0.00020260502 (7.716 sec)
INFO:tensorflow:global_step/sec: 12.8067
INFO:tensorflow:loss = 1.256631, step = 67780 (7.808 sec)
INFO:tensorflow:lr = 0.00020240148 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.8087
INFO:tensorflow:loss = 1.2600688, step = 67880 (7.807 sec)
INFO:tensorflow:lr = 0.00020219819 (7.808 sec)
INFO:tensorflow:global_step/sec: 12.6442
INFO:tensorflow:loss = 1.2547219, step = 67980 (7.909 sec)
INFO:tensorflow:lr = 0.00020199506 (7.909 sec)
INFO:tensorflow:global_step/sec: 12.7405
INFO:tensorflow:loss = 1.2526922, step = 68080 (7.849 sec)
INFO:tensorflow:lr = 0.0002017922 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.9993
INFO:tensorflow:loss = 1.2611421, step = 68180 (7.692 sec)
INFO:tensorflow:lr = 0.00020158946 (7.693 sec)
INFO:tensorflow:global_step/sec: 12.5706
INFO:tensorflow:loss = 1.2646718, step = 68280 (7.955 sec)
INFO:tensorflow:lr = 0.00020138695 (7.958 sec)
INFO:tensorflow:global_step/sec: 12.4633
INFO:tensorflow:loss = 1.2613611, step = 68380 (8.024 sec)
INFO:tensorflow:lr = 0.00020118465 (8.023 sec)
INFO:tensorflow:Saving checkpoints for 68460 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2606231.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-68460
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-68460
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.717
INFO:tensorflow:Best (Exact Match) Accuracy: 0.717
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-68460
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 68460 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.250214, step = 68460
INFO:tensorflow:lr = 0.00020102295
INFO:tensorflow:global_step/sec: 9.89178
INFO:tensorflow:loss = 1.2552146, step = 68560 (10.113 sec)
INFO:tensorflow:lr = 0.00020082104 (10.114 sec)
INFO:tensorflow:global_step/sec: 12.6776
INFO:tensorflow:loss = 1.2509973, step = 68660 (7.886 sec)
INFO:tensorflow:lr = 0.00020061928 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.514
INFO:tensorflow:loss = 1.2553383, step = 68760 (7.996 sec)
INFO:tensorflow:lr = 0.00020041778 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.7919
INFO:tensorflow:loss = 1.2552305, step = 68860 (7.817 sec)
INFO:tensorflow:lr = 0.00020021645 (7.818 sec)
INFO:tensorflow:global_step/sec: 12.8296
INFO:tensorflow:loss = 1.2542683, step = 68960 (7.791 sec)
INFO:tensorflow:lr = 0.0002000153 (7.790 sec)
INFO:tensorflow:global_step/sec: 12.5442
INFO:tensorflow:loss = 1.2532531, step = 69060 (7.971 sec)
INFO:tensorflow:lr = 0.0001998144 (7.970 sec)
INFO:tensorflow:global_step/sec: 12.781
INFO:tensorflow:loss = 1.2514119, step = 69160 (7.830 sec)
INFO:tensorflow:lr = 0.00019961369 (7.831 sec)
INFO:tensorflow:global_step/sec: 13.0693
INFO:tensorflow:loss = 1.2642561, step = 69260 (7.645 sec)
INFO:tensorflow:lr = 0.00019941316 (7.645 sec)
INFO:tensorflow:global_step/sec: 12.9636
INFO:tensorflow:loss = 1.2500038, step = 69360 (7.714 sec)
INFO:tensorflow:lr = 0.00019921285 (7.714 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.32059
INFO:tensorflow:loss = 1.2585869, step = 69460 (12.018 sec)
INFO:tensorflow:lr = 0.00019901272 (12.018 sec)
INFO:tensorflow:global_step/sec: 12.9882
INFO:tensorflow:loss = 1.2621295, step = 69560 (7.704 sec)
INFO:tensorflow:lr = 0.00019881282 (7.705 sec)
INFO:tensorflow:global_step/sec: 12.653
INFO:tensorflow:loss = 1.2571415, step = 69660 (7.898 sec)
INFO:tensorflow:lr = 0.0001986131 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.3987
INFO:tensorflow:loss = 1.252396, step = 69760 (8.065 sec)
INFO:tensorflow:lr = 0.00019841359 (8.064 sec)
INFO:tensorflow:global_step/sec: 12.7307
INFO:tensorflow:loss = 1.2507378, step = 69860 (7.860 sec)
INFO:tensorflow:lr = 0.0001982143 (7.858 sec)
INFO:tensorflow:global_step/sec: 13.0388
INFO:tensorflow:loss = 1.254819, step = 69960 (7.666 sec)
INFO:tensorflow:lr = 0.00019801517 (7.665 sec)
INFO:tensorflow:global_step/sec: 12.7131
INFO:tensorflow:loss = 1.2549182, step = 70060 (7.867 sec)
INFO:tensorflow:lr = 0.00019781626 (7.868 sec)
INFO:tensorflow:global_step/sec: 12.6675
INFO:tensorflow:loss = 1.2597824, step = 70160 (7.890 sec)
INFO:tensorflow:lr = 0.00019761756 (7.892 sec)
INFO:tensorflow:global_step/sec: 13.1409
INFO:tensorflow:loss = 1.2613363, step = 70260 (7.612 sec)
INFO:tensorflow:lr = 0.00019741904 (7.611 sec)
INFO:tensorflow:global_step/sec: 12.9385
INFO:tensorflow:loss = 1.2608613, step = 70360 (7.732 sec)
INFO:tensorflow:lr = 0.00019722072 (7.731 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.20857
INFO:tensorflow:loss = 1.2632818, step = 70460 (12.177 sec)
INFO:tensorflow:lr = 0.0001970226 (12.180 sec)
INFO:tensorflow:global_step/sec: 12.7764
INFO:tensorflow:loss = 1.2565051, step = 70560 (7.830 sec)
INFO:tensorflow:lr = 0.0001968247 (7.829 sec)
INFO:tensorflow:global_step/sec: 12.8345
INFO:tensorflow:loss = 1.2527218, step = 70660 (7.791 sec)
INFO:tensorflow:lr = 0.00019662696 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.5946
INFO:tensorflow:loss = 1.2486485, step = 70760 (7.944 sec)
INFO:tensorflow:lr = 0.00019642948 (7.941 sec)
INFO:tensorflow:global_step/sec: 12.8962
INFO:tensorflow:loss = 1.2574401, step = 70860 (7.755 sec)
INFO:tensorflow:lr = 0.00019623214 (7.755 sec)
INFO:tensorflow:global_step/sec: 12.8522
INFO:tensorflow:loss = 1.2536379, step = 70960 (7.778 sec)
INFO:tensorflow:lr = 0.000196035 (7.781 sec)
INFO:tensorflow:global_step/sec: 12.8556
INFO:tensorflow:loss = 1.253561, step = 71060 (7.776 sec)
INFO:tensorflow:lr = 0.0001958381 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.6452
INFO:tensorflow:loss = 1.2638847, step = 71160 (7.909 sec)
INFO:tensorflow:lr = 0.00019564138 (7.908 sec)
INFO:tensorflow:global_step/sec: 12.881
INFO:tensorflow:loss = 1.2507195, step = 71260 (7.769 sec)
INFO:tensorflow:lr = 0.00019544485 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.9177
INFO:tensorflow:loss = 1.2516303, step = 71360 (7.740 sec)
INFO:tensorflow:lr = 0.00019524853 (7.740 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.34864
INFO:tensorflow:loss = 1.2554841, step = 71460 (11.978 sec)
INFO:tensorflow:lr = 0.00019505239 (11.978 sec)
INFO:tensorflow:global_step/sec: 12.7332
INFO:tensorflow:loss = 1.2557956, step = 71560 (7.848 sec)
INFO:tensorflow:lr = 0.00019485643 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.8162
INFO:tensorflow:loss = 1.2516918, step = 71660 (7.802 sec)
INFO:tensorflow:lr = 0.00019466071 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.5072
INFO:tensorflow:loss = 1.2480005, step = 71760 (7.999 sec)
INFO:tensorflow:lr = 0.00019446517 (7.998 sec)
INFO:tensorflow:global_step/sec: 12.9678
INFO:tensorflow:loss = 1.2523248, step = 71860 (7.710 sec)
INFO:tensorflow:lr = 0.00019426983 (7.712 sec)
INFO:tensorflow:global_step/sec: 12.5132
INFO:tensorflow:loss = 1.2603774, step = 71960 (7.989 sec)
INFO:tensorflow:lr = 0.00019407466 (7.988 sec)
INFO:tensorflow:global_step/sec: 12.3631
INFO:tensorflow:loss = 1.2541709, step = 72060 (8.090 sec)
INFO:tensorflow:lr = 0.00019387972 (8.092 sec)
INFO:tensorflow:global_step/sec: 12.7245
INFO:tensorflow:loss = 1.2525417, step = 72160 (7.862 sec)
INFO:tensorflow:lr = 0.00019368496 (7.862 sec)
INFO:tensorflow:global_step/sec: 12.4976
INFO:tensorflow:loss = 1.2616658, step = 72260 (8.004 sec)
INFO:tensorflow:lr = 0.0001934904 (8.003 sec)
INFO:tensorflow:global_step/sec: 12.9216
INFO:tensorflow:loss = 1.2619153, step = 72360 (7.735 sec)
INFO:tensorflow:lr = 0.00019329603 (7.735 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.33511
INFO:tensorflow:loss = 1.2601154, step = 72460 (12.002 sec)
INFO:tensorflow:lr = 0.00019310186 (12.001 sec)
INFO:tensorflow:global_step/sec: 13.1451
INFO:tensorflow:loss = 1.251988, step = 72560 (7.604 sec)
INFO:tensorflow:lr = 0.00019290789 (7.604 sec)
INFO:tensorflow:global_step/sec: 12.6733
INFO:tensorflow:loss = 1.2546278, step = 72660 (7.888 sec)
INFO:tensorflow:lr = 0.0001927141 (7.888 sec)
INFO:tensorflow:global_step/sec: 12.3631
INFO:tensorflow:loss = 1.2519424, step = 72760 (8.088 sec)
INFO:tensorflow:lr = 0.00019252051 (8.088 sec)
INFO:tensorflow:global_step/sec: 12.6768
INFO:tensorflow:loss = 1.2527174, step = 72860 (7.889 sec)
INFO:tensorflow:lr = 0.00019232712 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.743
INFO:tensorflow:loss = 1.2503885, step = 72960 (7.847 sec)
INFO:tensorflow:lr = 0.00019213393 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.433
INFO:tensorflow:loss = 1.2566782, step = 73060 (8.046 sec)
INFO:tensorflow:lr = 0.00019194091 (8.046 sec)
INFO:tensorflow:global_step/sec: 12.7119
INFO:tensorflow:loss = 1.2558047, step = 73160 (7.867 sec)
INFO:tensorflow:lr = 0.00019174813 (7.867 sec)
INFO:tensorflow:global_step/sec: 12.8101
INFO:tensorflow:loss = 1.2558652, step = 73260 (7.804 sec)
INFO:tensorflow:lr = 0.00019155549 (7.805 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.79918
INFO:tensorflow:loss = 1.2639738, step = 73360 (11.364 sec)
INFO:tensorflow:lr = 0.0001913631 (11.362 sec)
INFO:tensorflow:global_step/sec: 12.6976
INFO:tensorflow:loss = 1.2517492, step = 73460 (7.876 sec)
INFO:tensorflow:lr = 0.00019117084 (7.876 sec)
INFO:tensorflow:global_step/sec: 12.6726
INFO:tensorflow:loss = 1.2523484, step = 73560 (7.896 sec)
INFO:tensorflow:lr = 0.00019097881 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.6952
INFO:tensorflow:loss = 1.250717, step = 73660 (7.871 sec)
INFO:tensorflow:lr = 0.00019078696 (7.871 sec)
INFO:tensorflow:global_step/sec: 12.9998
INFO:tensorflow:loss = 1.2526314, step = 73760 (7.693 sec)
INFO:tensorflow:lr = 0.00019059531 (7.694 sec)
INFO:tensorflow:global_step/sec: 12.9429
INFO:tensorflow:loss = 1.2553871, step = 73860 (7.726 sec)
INFO:tensorflow:lr = 0.00019040387 (7.728 sec)
INFO:tensorflow:global_step/sec: 12.7098
INFO:tensorflow:loss = 1.2495402, step = 73960 (7.873 sec)
INFO:tensorflow:lr = 0.00019021258 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.7847
INFO:tensorflow:loss = 1.2583013, step = 74060 (7.818 sec)
INFO:tensorflow:lr = 0.00019002153 (7.820 sec)
INFO:tensorflow:global_step/sec: 12.606
INFO:tensorflow:loss = 1.2551463, step = 74160 (7.933 sec)
INFO:tensorflow:lr = 0.00018983062 (7.936 sec)
INFO:tensorflow:global_step/sec: 12.569
INFO:tensorflow:loss = 1.2499317, step = 74260 (7.961 sec)
INFO:tensorflow:lr = 0.00018963996 (7.956 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.31888
INFO:tensorflow:loss = 1.2556055, step = 74360 (10.732 sec)
INFO:tensorflow:lr = 0.00018944943 (10.731 sec)
INFO:tensorflow:global_step/sec: 12.5155
INFO:tensorflow:loss = 1.2517197, step = 74460 (7.990 sec)
INFO:tensorflow:lr = 0.00018925912 (7.991 sec)
INFO:tensorflow:global_step/sec: 12.8288
INFO:tensorflow:loss = 1.2531888, step = 74560 (7.789 sec)
INFO:tensorflow:lr = 0.00018906903 (7.788 sec)
INFO:tensorflow:global_step/sec: 12.5171
INFO:tensorflow:loss = 1.2516396, step = 74660 (7.989 sec)
INFO:tensorflow:lr = 0.0001888791 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.7424
INFO:tensorflow:loss = 1.2480764, step = 74760 (7.848 sec)
INFO:tensorflow:lr = 0.00018868937 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.5514
INFO:tensorflow:loss = 1.2534533, step = 74860 (7.970 sec)
INFO:tensorflow:lr = 0.00018849983 (7.970 sec)
INFO:tensorflow:global_step/sec: 12.8268
INFO:tensorflow:loss = 1.2513977, step = 74960 (7.800 sec)
INFO:tensorflow:lr = 0.00018831047 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.8144
INFO:tensorflow:loss = 1.2506344, step = 75060 (7.798 sec)
INFO:tensorflow:lr = 0.0001881213 (7.802 sec)
INFO:tensorflow:global_step/sec: 12.7008
INFO:tensorflow:loss = 1.2517682, step = 75160 (7.874 sec)
INFO:tensorflow:lr = 0.00018793234 (7.872 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2503
INFO:tensorflow:loss = 1.2574689, step = 75260 (8.171 sec)
INFO:tensorflow:lr = 0.00018774354 (8.176 sec)
INFO:tensorflow:global_step/sec: 10.6335
INFO:tensorflow:loss = 1.26586, step = 75360 (9.400 sec)
INFO:tensorflow:lr = 0.00018755496 (9.393 sec)
INFO:tensorflow:global_step/sec: 12.973
INFO:tensorflow:loss = 1.2528296, step = 75460 (7.707 sec)
INFO:tensorflow:lr = 0.00018736653 (7.709 sec)
INFO:tensorflow:global_step/sec: 12.2656
INFO:tensorflow:loss = 1.2583458, step = 75560 (8.154 sec)
INFO:tensorflow:lr = 0.00018717833 (8.153 sec)
INFO:tensorflow:global_step/sec: 12.8809
INFO:tensorflow:loss = 1.2474772, step = 75660 (7.759 sec)
INFO:tensorflow:lr = 0.00018699029 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.8353
INFO:tensorflow:loss = 1.2567656, step = 75760 (7.796 sec)
INFO:tensorflow:lr = 0.00018680248 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.8607
INFO:tensorflow:loss = 1.2529895, step = 75860 (7.776 sec)
INFO:tensorflow:lr = 0.00018661484 (7.777 sec)
INFO:tensorflow:global_step/sec: 12.4908
INFO:tensorflow:loss = 1.255029, step = 75960 (8.005 sec)
INFO:tensorflow:lr = 0.00018642735 (8.006 sec)
INFO:tensorflow:global_step/sec: 12.4031
INFO:tensorflow:loss = 1.2508453, step = 76060 (8.062 sec)
INFO:tensorflow:lr = 0.00018624008 (8.060 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2921
INFO:tensorflow:loss = 1.2630798, step = 76160 (8.134 sec)
INFO:tensorflow:lr = 0.000186053 (8.136 sec)
INFO:tensorflow:global_step/sec: 10.9934
INFO:tensorflow:loss = 1.255268, step = 76260 (9.093 sec)
INFO:tensorflow:lr = 0.00018586611 (9.093 sec)
INFO:tensorflow:global_step/sec: 12.8284
INFO:tensorflow:loss = 1.2487235, step = 76360 (7.795 sec)
INFO:tensorflow:lr = 0.00018567941 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.6785
INFO:tensorflow:loss = 1.2549771, step = 76460 (7.893 sec)
INFO:tensorflow:lr = 0.0001854929 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.5547
INFO:tensorflow:loss = 1.256425, step = 76560 (7.963 sec)
INFO:tensorflow:lr = 0.00018530655 (7.964 sec)
INFO:tensorflow:global_step/sec: 12.5549
INFO:tensorflow:loss = 1.2490952, step = 76660 (7.962 sec)
INFO:tensorflow:lr = 0.00018512041 (7.961 sec)
INFO:tensorflow:global_step/sec: 12.831
INFO:tensorflow:loss = 1.2511157, step = 76760 (7.792 sec)
INFO:tensorflow:lr = 0.00018493446 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.6078
INFO:tensorflow:loss = 1.2497431, step = 76860 (7.937 sec)
INFO:tensorflow:lr = 0.00018474869 (7.938 sec)
INFO:tensorflow:global_step/sec: 12.6514
INFO:tensorflow:loss = 1.2566417, step = 76960 (7.902 sec)
INFO:tensorflow:lr = 0.00018456309 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.9655
INFO:tensorflow:loss = 1.2616142, step = 77060 (7.713 sec)
INFO:tensorflow:lr = 0.00018437768 (7.715 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.9968
INFO:tensorflow:loss = 1.2498459, step = 77160 (8.342 sec)
INFO:tensorflow:lr = 0.00018419247 (8.347 sec)
INFO:tensorflow:global_step/sec: 11.3735
INFO:tensorflow:loss = 1.2483019, step = 77260 (8.789 sec)
INFO:tensorflow:lr = 0.00018400745 (8.781 sec)
INFO:tensorflow:global_step/sec: 12.7229
INFO:tensorflow:loss = 1.2514182, step = 77360 (7.857 sec)
INFO:tensorflow:lr = 0.00018382262 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.6732
INFO:tensorflow:loss = 1.2530181, step = 77460 (7.893 sec)
INFO:tensorflow:lr = 0.00018363795 (7.894 sec)
INFO:tensorflow:global_step/sec: 12.605
INFO:tensorflow:loss = 1.2535021, step = 77560 (7.931 sec)
INFO:tensorflow:lr = 0.00018345349 (7.930 sec)
INFO:tensorflow:global_step/sec: 12.9194
INFO:tensorflow:loss = 1.2538028, step = 77660 (7.743 sec)
INFO:tensorflow:lr = 0.00018326919 (7.742 sec)
INFO:tensorflow:global_step/sec: 12.62
INFO:tensorflow:loss = 1.2521385, step = 77760 (7.923 sec)
INFO:tensorflow:lr = 0.00018308511 (7.923 sec)
INFO:tensorflow:global_step/sec: 12.8095
INFO:tensorflow:loss = 1.252689, step = 77860 (7.806 sec)
INFO:tensorflow:lr = 0.0001829012 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.977
INFO:tensorflow:loss = 1.2580132, step = 77960 (7.707 sec)
INFO:tensorflow:lr = 0.00018271746 (7.707 sec)
INFO:tensorflow:global_step/sec: 12.992
INFO:tensorflow:loss = 1.2574784, step = 78060 (7.695 sec)
INFO:tensorflow:lr = 0.00018253391 (7.695 sec)
INFO:tensorflow:global_step/sec: 12.6106
INFO:tensorflow:loss = 1.2529795, step = 78160 (7.931 sec)
INFO:tensorflow:lr = 0.00018235056 (7.930 sec)
INFO:tensorflow:Saving checkpoints for 78240 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2499174.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-78240
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-78240
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.717
INFO:tensorflow:Best (Exact Match) Accuracy: 0.717
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-78240
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 78240 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2590173, step = 78240
INFO:tensorflow:lr = 0.000182204
INFO:tensorflow:global_step/sec: 10.2335
INFO:tensorflow:loss = 1.2496594, step = 78340 (9.780 sec)
INFO:tensorflow:lr = 0.00018202097 (9.780 sec)
INFO:tensorflow:global_step/sec: 12.6641
INFO:tensorflow:loss = 1.2591709, step = 78440 (7.896 sec)
INFO:tensorflow:lr = 0.00018183814 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.8297
INFO:tensorflow:loss = 1.2547472, step = 78540 (7.788 sec)
INFO:tensorflow:lr = 0.00018165546 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.8503
INFO:tensorflow:loss = 1.2477771, step = 78640 (7.788 sec)
INFO:tensorflow:lr = 0.00018147299 (7.785 sec)
INFO:tensorflow:global_step/sec: 12.4826
INFO:tensorflow:loss = 1.250107, step = 78740 (8.005 sec)
INFO:tensorflow:lr = 0.0001812907 (8.005 sec)
INFO:tensorflow:global_step/sec: 12.6461
INFO:tensorflow:loss = 1.2553511, step = 78840 (7.909 sec)
INFO:tensorflow:lr = 0.00018110858 (7.909 sec)
INFO:tensorflow:global_step/sec: 12.8929
INFO:tensorflow:loss = 1.2516081, step = 78940 (7.762 sec)
INFO:tensorflow:lr = 0.00018092665 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.6101
INFO:tensorflow:loss = 1.2541536, step = 79040 (7.927 sec)
INFO:tensorflow:lr = 0.00018074492 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.4696
INFO:tensorflow:loss = 1.2553225, step = 79140 (8.015 sec)
INFO:tensorflow:lr = 0.00018056334 (8.015 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35453
INFO:tensorflow:loss = 1.2502196, step = 79240 (11.971 sec)
INFO:tensorflow:lr = 0.00018038196 (11.971 sec)
INFO:tensorflow:global_step/sec: 12.639
INFO:tensorflow:loss = 1.2486528, step = 79340 (7.912 sec)
INFO:tensorflow:lr = 0.00018020078 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.694
INFO:tensorflow:loss = 1.248358, step = 79440 (7.883 sec)
INFO:tensorflow:lr = 0.00018001975 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.6918
INFO:tensorflow:loss = 1.2552594, step = 79540 (7.873 sec)
INFO:tensorflow:lr = 0.00017983893 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.7387
INFO:tensorflow:loss = 1.2540479, step = 79640 (7.857 sec)
INFO:tensorflow:lr = 0.00017965824 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.7917
INFO:tensorflow:loss = 1.2457458, step = 79740 (7.811 sec)
INFO:tensorflow:lr = 0.00017947779 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.4802
INFO:tensorflow:loss = 1.2563258, step = 79840 (8.015 sec)
INFO:tensorflow:lr = 0.0001792975 (8.016 sec)
INFO:tensorflow:global_step/sec: 12.8425
INFO:tensorflow:loss = 1.2508807, step = 79940 (7.790 sec)
INFO:tensorflow:lr = 0.0001791174 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.7452
INFO:tensorflow:loss = 1.2514696, step = 80040 (7.845 sec)
INFO:tensorflow:lr = 0.00017893747 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.8878
INFO:tensorflow:loss = 1.2509739, step = 80140 (7.755 sec)
INFO:tensorflow:lr = 0.0001787577 (7.757 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.38154
INFO:tensorflow:loss = 1.2584447, step = 80240 (11.935 sec)
INFO:tensorflow:lr = 0.00017857815 (11.934 sec)
INFO:tensorflow:global_step/sec: 12.6567
INFO:tensorflow:loss = 1.2512501, step = 80340 (7.896 sec)
INFO:tensorflow:lr = 0.00017839875 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.7351
INFO:tensorflow:loss = 1.2498204, step = 80440 (7.853 sec)
INFO:tensorflow:lr = 0.00017821955 (7.850 sec)
INFO:tensorflow:global_step/sec: 12.8998
INFO:tensorflow:loss = 1.254194, step = 80540 (7.757 sec)
INFO:tensorflow:lr = 0.00017804053 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.6751
INFO:tensorflow:loss = 1.2590884, step = 80640 (7.887 sec)
INFO:tensorflow:lr = 0.00017786169 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.8078
INFO:tensorflow:loss = 1.2537712, step = 80740 (7.811 sec)
INFO:tensorflow:lr = 0.000177683 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.8097
INFO:tensorflow:loss = 1.2545077, step = 80840 (7.800 sec)
INFO:tensorflow:lr = 0.00017750452 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.8288
INFO:tensorflow:loss = 1.24793, step = 80940 (7.794 sec)
INFO:tensorflow:lr = 0.00017732622 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.9341
INFO:tensorflow:loss = 1.2493593, step = 81040 (7.732 sec)
INFO:tensorflow:lr = 0.00017714809 (7.731 sec)
INFO:tensorflow:global_step/sec: 12.6921
INFO:tensorflow:loss = 1.2523218, step = 81140 (7.879 sec)
INFO:tensorflow:lr = 0.00017697013 (7.880 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.29548
INFO:tensorflow:loss = 1.2478547, step = 81240 (12.054 sec)
INFO:tensorflow:lr = 0.00017679235 (12.054 sec)
INFO:tensorflow:global_step/sec: 12.8312
INFO:tensorflow:loss = 1.2478245, step = 81340 (7.797 sec)
INFO:tensorflow:lr = 0.00017661476 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.5046
INFO:tensorflow:loss = 1.2513237, step = 81440 (7.999 sec)
INFO:tensorflow:lr = 0.00017643734 (7.999 sec)
INFO:tensorflow:global_step/sec: 13.0428
INFO:tensorflow:loss = 1.2500213, step = 81540 (7.664 sec)
INFO:tensorflow:lr = 0.00017626012 (7.665 sec)
INFO:tensorflow:global_step/sec: 12.8603
INFO:tensorflow:loss = 1.2503232, step = 81640 (7.774 sec)
INFO:tensorflow:lr = 0.00017608305 (7.772 sec)
INFO:tensorflow:global_step/sec: 12.8574
INFO:tensorflow:loss = 1.2482414, step = 81740 (7.781 sec)
INFO:tensorflow:lr = 0.00017590619 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.2935
INFO:tensorflow:loss = 1.2473918, step = 81840 (8.131 sec)
INFO:tensorflow:lr = 0.00017572947 (8.131 sec)
INFO:tensorflow:global_step/sec: 12.9845
INFO:tensorflow:loss = 1.2510718, step = 81940 (7.701 sec)
INFO:tensorflow:lr = 0.00017555297 (7.702 sec)
INFO:tensorflow:global_step/sec: 12.6733
INFO:tensorflow:loss = 1.2469774, step = 82040 (7.891 sec)
INFO:tensorflow:lr = 0.00017537661 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.6176
INFO:tensorflow:loss = 1.2501423, step = 82140 (7.925 sec)
INFO:tensorflow:lr = 0.00017520043 (7.928 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.49764
INFO:tensorflow:loss = 1.2507443, step = 82240 (11.768 sec)
INFO:tensorflow:lr = 0.00017502444 (11.764 sec)
INFO:tensorflow:global_step/sec: 12.5804
INFO:tensorflow:loss = 1.2484735, step = 82340 (7.952 sec)
INFO:tensorflow:lr = 0.00017484862 (7.953 sec)
INFO:tensorflow:global_step/sec: 13.0737
INFO:tensorflow:loss = 1.250423, step = 82440 (7.648 sec)
INFO:tensorflow:lr = 0.000174673 (7.648 sec)
INFO:tensorflow:global_step/sec: 12.6908
INFO:tensorflow:loss = 1.2670717, step = 82540 (7.882 sec)
INFO:tensorflow:lr = 0.00017449753 (7.882 sec)
INFO:tensorflow:global_step/sec: 12.838
INFO:tensorflow:loss = 1.249461, step = 82640 (7.791 sec)
INFO:tensorflow:lr = 0.00017432224 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.7286
INFO:tensorflow:loss = 1.2500602, step = 82740 (7.849 sec)
INFO:tensorflow:lr = 0.0001741471 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.8635
INFO:tensorflow:loss = 1.250238, step = 82840 (7.776 sec)
INFO:tensorflow:lr = 0.00017397219 (7.778 sec)
INFO:tensorflow:global_step/sec: 12.5899
INFO:tensorflow:loss = 1.2476375, step = 82940 (7.945 sec)
INFO:tensorflow:lr = 0.00017379744 (7.943 sec)
INFO:tensorflow:global_step/sec: 12.8872
INFO:tensorflow:loss = 1.2561243, step = 83040 (7.760 sec)
INFO:tensorflow:lr = 0.00017362286 (7.760 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.60542
INFO:tensorflow:loss = 1.249593, step = 83140 (11.621 sec)
INFO:tensorflow:lr = 0.00017344844 (11.621 sec)
INFO:tensorflow:global_step/sec: 13.0203
INFO:tensorflow:loss = 1.2486179, step = 83240 (7.676 sec)
INFO:tensorflow:lr = 0.00017327421 (7.676 sec)
INFO:tensorflow:global_step/sec: 12.5732
INFO:tensorflow:loss = 1.2553233, step = 83340 (7.958 sec)
INFO:tensorflow:lr = 0.00017310014 (7.959 sec)
INFO:tensorflow:global_step/sec: 12.7835
INFO:tensorflow:loss = 1.2564698, step = 83440 (7.822 sec)
INFO:tensorflow:lr = 0.00017292627 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.9991
INFO:tensorflow:loss = 1.2600302, step = 83540 (7.694 sec)
INFO:tensorflow:lr = 0.00017275255 (7.694 sec)
INFO:tensorflow:global_step/sec: 12.6979
INFO:tensorflow:loss = 1.2510674, step = 83640 (7.870 sec)
INFO:tensorflow:lr = 0.000172579 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.7094
INFO:tensorflow:loss = 1.2540224, step = 83740 (7.869 sec)
INFO:tensorflow:lr = 0.00017240565 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.7121
INFO:tensorflow:loss = 1.2510121, step = 83840 (7.869 sec)
INFO:tensorflow:lr = 0.00017223245 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.6853
INFO:tensorflow:loss = 1.2614245, step = 83940 (7.885 sec)
INFO:tensorflow:lr = 0.00017205944 (7.884 sec)
INFO:tensorflow:global_step/sec: 12.7461
INFO:tensorflow:loss = 1.2500675, step = 84040 (7.844 sec)
INFO:tensorflow:lr = 0.00017188663 (7.847 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.15836
INFO:tensorflow:loss = 1.259658, step = 84140 (10.922 sec)
INFO:tensorflow:lr = 0.00017171395 (10.920 sec)
INFO:tensorflow:global_step/sec: 13.0493
INFO:tensorflow:loss = 1.2597753, step = 84240 (7.659 sec)
INFO:tensorflow:lr = 0.00017154145 (7.658 sec)
INFO:tensorflow:global_step/sec: 12.8351
INFO:tensorflow:loss = 1.2478659, step = 84340 (7.792 sec)
INFO:tensorflow:lr = 0.00017136915 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.6189
INFO:tensorflow:loss = 1.2543241, step = 84440 (7.923 sec)
INFO:tensorflow:lr = 0.00017119701 (7.922 sec)
INFO:tensorflow:global_step/sec: 12.8493
INFO:tensorflow:loss = 1.2495148, step = 84540 (7.783 sec)
INFO:tensorflow:lr = 0.00017102502 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.5098
INFO:tensorflow:loss = 1.2590244, step = 84640 (7.998 sec)
INFO:tensorflow:lr = 0.00017085322 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.8627
INFO:tensorflow:loss = 1.2492456, step = 84740 (7.770 sec)
INFO:tensorflow:lr = 0.0001706816 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.8319
INFO:tensorflow:loss = 1.2496346, step = 84840 (7.796 sec)
INFO:tensorflow:lr = 0.00017051013 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.6574
INFO:tensorflow:loss = 1.2487538, step = 84940 (7.898 sec)
INFO:tensorflow:lr = 0.00017033887 (7.901 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.3381
INFO:tensorflow:loss = 1.2556379, step = 85040 (8.113 sec)
INFO:tensorflow:lr = 0.00017016775 (8.114 sec)
INFO:tensorflow:global_step/sec: 10.7431
INFO:tensorflow:loss = 1.2477072, step = 85140 (9.305 sec)
INFO:tensorflow:lr = 0.00016999681 (9.300 sec)
INFO:tensorflow:global_step/sec: 13.1212
INFO:tensorflow:loss = 1.2478539, step = 85240 (7.621 sec)
INFO:tensorflow:lr = 0.00016982605 (7.625 sec)
INFO:tensorflow:global_step/sec: 13.0129
INFO:tensorflow:loss = 1.2585075, step = 85340 (7.680 sec)
INFO:tensorflow:lr = 0.00016965547 (7.676 sec)
INFO:tensorflow:global_step/sec: 12.9017
INFO:tensorflow:loss = 1.2566411, step = 85440 (7.750 sec)
INFO:tensorflow:lr = 0.00016948502 (7.750 sec)
INFO:tensorflow:global_step/sec: 12.7359
INFO:tensorflow:loss = 1.2534791, step = 85540 (7.857 sec)
INFO:tensorflow:lr = 0.00016931478 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.2424
INFO:tensorflow:loss = 1.2601684, step = 85640 (8.168 sec)
INFO:tensorflow:lr = 0.00016914468 (8.168 sec)
INFO:tensorflow:global_step/sec: 12.5107
INFO:tensorflow:loss = 1.2539284, step = 85740 (7.995 sec)
INFO:tensorflow:lr = 0.00016897477 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.9542
INFO:tensorflow:loss = 1.2505609, step = 85840 (7.713 sec)
INFO:tensorflow:lr = 0.00016880504 (7.712 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.6341
INFO:tensorflow:loss = 1.2487622, step = 85940 (7.922 sec)
INFO:tensorflow:lr = 0.00016863547 (7.923 sec)
INFO:tensorflow:global_step/sec: 10.8304
INFO:tensorflow:loss = 1.2539859, step = 86040 (9.231 sec)
INFO:tensorflow:lr = 0.00016846608 (9.230 sec)
INFO:tensorflow:global_step/sec: 12.7512
INFO:tensorflow:loss = 1.2534391, step = 86140 (7.844 sec)
INFO:tensorflow:lr = 0.00016829684 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.7686
INFO:tensorflow:loss = 1.2543765, step = 86240 (7.829 sec)
INFO:tensorflow:lr = 0.00016812778 (7.827 sec)
INFO:tensorflow:global_step/sec: 12.956
INFO:tensorflow:loss = 1.2502369, step = 86340 (7.719 sec)
INFO:tensorflow:lr = 0.00016795889 (7.719 sec)
INFO:tensorflow:global_step/sec: 12.8613
INFO:tensorflow:loss = 1.2478958, step = 86440 (7.771 sec)
INFO:tensorflow:lr = 0.00016779019 (7.772 sec)
INFO:tensorflow:global_step/sec: 13.1076
INFO:tensorflow:loss = 1.2502476, step = 86540 (7.628 sec)
INFO:tensorflow:lr = 0.00016762162 (7.635 sec)
INFO:tensorflow:global_step/sec: 12.6676
INFO:tensorflow:loss = 1.2501, step = 86640 (7.895 sec)
INFO:tensorflow:lr = 0.00016745325 (7.888 sec)
INFO:tensorflow:global_step/sec: 12.7157
INFO:tensorflow:loss = 1.2478064, step = 86740 (7.863 sec)
INFO:tensorflow:lr = 0.00016728503 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.7067
INFO:tensorflow:loss = 1.2639413, step = 86840 (7.870 sec)
INFO:tensorflow:lr = 0.00016711699 (7.874 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0525
INFO:tensorflow:loss = 1.252271, step = 86940 (8.303 sec)
INFO:tensorflow:lr = 0.00016694913 (8.304 sec)
INFO:tensorflow:global_step/sec: 11.429
INFO:tensorflow:loss = 1.252577, step = 87040 (8.749 sec)
INFO:tensorflow:lr = 0.0001667814 (8.743 sec)
INFO:tensorflow:global_step/sec: 12.8618
INFO:tensorflow:loss = 1.2451332, step = 87140 (7.772 sec)
INFO:tensorflow:lr = 0.00016661389 (7.774 sec)
INFO:tensorflow:global_step/sec: 13.0815
INFO:tensorflow:loss = 1.250391, step = 87240 (7.649 sec)
INFO:tensorflow:lr = 0.00016644651 (7.649 sec)
INFO:tensorflow:global_step/sec: 12.8
INFO:tensorflow:loss = 1.250594, step = 87340 (7.811 sec)
INFO:tensorflow:lr = 0.00016627931 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.9375
INFO:tensorflow:loss = 1.2503841, step = 87440 (7.726 sec)
INFO:tensorflow:lr = 0.00016611228 (7.727 sec)
INFO:tensorflow:global_step/sec: 12.8328
INFO:tensorflow:loss = 1.2486295, step = 87540 (7.795 sec)
INFO:tensorflow:lr = 0.00016594543 (7.794 sec)
INFO:tensorflow:global_step/sec: 12.5163
INFO:tensorflow:loss = 1.2504075, step = 87640 (7.985 sec)
INFO:tensorflow:lr = 0.00016577872 (7.989 sec)
INFO:tensorflow:global_step/sec: 13.0312
INFO:tensorflow:loss = 1.2518604, step = 87740 (7.674 sec)
INFO:tensorflow:lr = 0.00016561219 (7.671 sec)
INFO:tensorflow:global_step/sec: 12.6941
INFO:tensorflow:loss = 1.2477338, step = 87840 (7.878 sec)
INFO:tensorflow:lr = 0.00016544582 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.3306
INFO:tensorflow:loss = 1.2489831, step = 87940 (8.110 sec)
INFO:tensorflow:lr = 0.00016527963 (8.109 sec)
INFO:tensorflow:Saving checkpoints for 88020 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2430813.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-88020
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-88020
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.721
INFO:tensorflow:Best (Exact Match) Accuracy: 0.721
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-88020
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 88020 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2478541, step = 88020
INFO:tensorflow:lr = 0.00016514679
INFO:tensorflow:global_step/sec: 10.07
INFO:tensorflow:loss = 1.2509733, step = 88120 (9.934 sec)
INFO:tensorflow:lr = 0.0001649809 (9.935 sec)
INFO:tensorflow:global_step/sec: 12.5025
INFO:tensorflow:loss = 1.249775, step = 88220 (7.999 sec)
INFO:tensorflow:lr = 0.00016481518 (7.996 sec)
INFO:tensorflow:global_step/sec: 12.7872
INFO:tensorflow:loss = 1.2507293, step = 88320 (7.825 sec)
INFO:tensorflow:lr = 0.00016464961 (7.831 sec)
INFO:tensorflow:global_step/sec: 12.7513
INFO:tensorflow:loss = 1.2496305, step = 88420 (7.836 sec)
INFO:tensorflow:lr = 0.00016448423 (7.834 sec)
INFO:tensorflow:global_step/sec: 12.9031
INFO:tensorflow:loss = 1.2485484, step = 88520 (7.751 sec)
INFO:tensorflow:lr = 0.00016431899 (7.748 sec)
INFO:tensorflow:global_step/sec: 12.803
INFO:tensorflow:loss = 1.2538512, step = 88620 (7.814 sec)
INFO:tensorflow:lr = 0.00016415393 (7.814 sec)
INFO:tensorflow:global_step/sec: 12.4804
INFO:tensorflow:loss = 1.2560003, step = 88720 (8.008 sec)
INFO:tensorflow:lr = 0.00016398903 (8.010 sec)
INFO:tensorflow:global_step/sec: 12.8263
INFO:tensorflow:loss = 1.2487856, step = 88820 (7.796 sec)
INFO:tensorflow:lr = 0.0001638243 (7.794 sec)
INFO:tensorflow:global_step/sec: 12.9732
INFO:tensorflow:loss = 1.2564486, step = 88920 (7.708 sec)
INFO:tensorflow:lr = 0.00016365973 (7.708 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.3463
INFO:tensorflow:loss = 1.248512, step = 89020 (11.987 sec)
INFO:tensorflow:lr = 0.00016349532 (11.987 sec)
INFO:tensorflow:global_step/sec: 12.8714
INFO:tensorflow:loss = 1.2499951, step = 89120 (7.770 sec)
INFO:tensorflow:lr = 0.0001633311 (7.771 sec)
INFO:tensorflow:global_step/sec: 12.754
INFO:tensorflow:loss = 1.2510864, step = 89220 (7.839 sec)
INFO:tensorflow:lr = 0.00016316702 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.7582
INFO:tensorflow:loss = 1.2505963, step = 89320 (7.835 sec)
INFO:tensorflow:lr = 0.00016300312 (7.836 sec)
INFO:tensorflow:global_step/sec: 12.6331
INFO:tensorflow:loss = 1.2495183, step = 89420 (7.915 sec)
INFO:tensorflow:lr = 0.00016283937 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.6353
INFO:tensorflow:loss = 1.250917, step = 89520 (7.914 sec)
INFO:tensorflow:lr = 0.0001626758 (7.917 sec)
INFO:tensorflow:global_step/sec: 12.993
INFO:tensorflow:loss = 1.2484233, step = 89620 (7.699 sec)
INFO:tensorflow:lr = 0.0001625124 (7.696 sec)
INFO:tensorflow:global_step/sec: 12.8745
INFO:tensorflow:loss = 1.2567275, step = 89720 (7.770 sec)
INFO:tensorflow:lr = 0.00016234916 (7.770 sec)
INFO:tensorflow:global_step/sec: 12.7192
INFO:tensorflow:loss = 1.2655329, step = 89820 (7.862 sec)
INFO:tensorflow:lr = 0.00016218606 (7.862 sec)
INFO:tensorflow:global_step/sec: 12.7579
INFO:tensorflow:loss = 1.2497483, step = 89920 (7.833 sec)
INFO:tensorflow:lr = 0.00016202313 (7.834 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35646
INFO:tensorflow:loss = 1.2529335, step = 90020 (11.966 sec)
INFO:tensorflow:lr = 0.00016186039 (11.965 sec)
INFO:tensorflow:global_step/sec: 12.8463
INFO:tensorflow:loss = 1.248037, step = 90120 (7.789 sec)
INFO:tensorflow:lr = 0.00016169778 (7.790 sec)
INFO:tensorflow:global_step/sec: 12.7832
INFO:tensorflow:loss = 1.2473701, step = 90220 (7.818 sec)
INFO:tensorflow:lr = 0.00016153537 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.9166
INFO:tensorflow:loss = 1.2491748, step = 90320 (7.747 sec)
INFO:tensorflow:lr = 0.00016137307 (7.747 sec)
INFO:tensorflow:global_step/sec: 12.7024
INFO:tensorflow:loss = 1.2531077, step = 90420 (7.871 sec)
INFO:tensorflow:lr = 0.00016121099 (7.871 sec)
INFO:tensorflow:global_step/sec: 12.6706
INFO:tensorflow:loss = 1.2527239, step = 90520 (7.894 sec)
INFO:tensorflow:lr = 0.00016104903 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.5734
INFO:tensorflow:loss = 1.2484795, step = 90620 (7.952 sec)
INFO:tensorflow:lr = 0.00016088727 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.621
INFO:tensorflow:loss = 1.2495238, step = 90720 (7.924 sec)
INFO:tensorflow:lr = 0.00016072566 (7.924 sec)
INFO:tensorflow:global_step/sec: 12.8078
INFO:tensorflow:loss = 1.2501513, step = 90820 (7.802 sec)
INFO:tensorflow:lr = 0.00016056419 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.96
INFO:tensorflow:loss = 1.2493507, step = 90920 (7.716 sec)
INFO:tensorflow:lr = 0.0001604029 (7.715 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.41387
INFO:tensorflow:loss = 1.2496051, step = 91020 (11.889 sec)
INFO:tensorflow:lr = 0.00016024178 (11.897 sec)
INFO:tensorflow:global_step/sec: 12.9541
INFO:tensorflow:loss = 1.247105, step = 91120 (7.718 sec)
INFO:tensorflow:lr = 0.00016008082 (7.710 sec)
INFO:tensorflow:global_step/sec: 12.7781
INFO:tensorflow:loss = 1.2484589, step = 91220 (7.825 sec)
INFO:tensorflow:lr = 0.00015992 (7.826 sec)
INFO:tensorflow:global_step/sec: 13.0741
INFO:tensorflow:loss = 1.2535778, step = 91320 (7.650 sec)
INFO:tensorflow:lr = 0.00015975937 (7.649 sec)
INFO:tensorflow:global_step/sec: 12.5744
INFO:tensorflow:loss = 1.255234, step = 91420 (7.952 sec)
INFO:tensorflow:lr = 0.00015959887 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.4252
INFO:tensorflow:loss = 1.2474556, step = 91520 (8.050 sec)
INFO:tensorflow:lr = 0.00015943855 (8.050 sec)
INFO:tensorflow:global_step/sec: 12.5663
INFO:tensorflow:loss = 1.245488, step = 91620 (7.954 sec)
INFO:tensorflow:lr = 0.0001592784 (7.955 sec)
INFO:tensorflow:global_step/sec: 12.7127
INFO:tensorflow:loss = 1.2660935, step = 91720 (7.866 sec)
INFO:tensorflow:lr = 0.0001591184 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.5399
INFO:tensorflow:loss = 1.2542043, step = 91820 (7.975 sec)
INFO:tensorflow:lr = 0.00015895854 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.8243
INFO:tensorflow:loss = 1.250056, step = 91920 (7.798 sec)
INFO:tensorflow:lr = 0.00015879888 (7.806 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35817
INFO:tensorflow:loss = 1.2492906, step = 92020 (11.971 sec)
INFO:tensorflow:lr = 0.00015863935 (11.962 sec)
INFO:tensorflow:global_step/sec: 12.9871
INFO:tensorflow:loss = 1.257855, step = 92120 (7.695 sec)
INFO:tensorflow:lr = 0.00015848 (7.695 sec)
INFO:tensorflow:global_step/sec: 12.8269
INFO:tensorflow:loss = 1.2487328, step = 92220 (7.795 sec)
INFO:tensorflow:lr = 0.0001583208 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.7098
INFO:tensorflow:loss = 1.2490268, step = 92320 (7.870 sec)
INFO:tensorflow:lr = 0.00015816175 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.9235
INFO:tensorflow:loss = 1.2516989, step = 92420 (7.740 sec)
INFO:tensorflow:lr = 0.00015800289 (7.739 sec)
INFO:tensorflow:global_step/sec: 13.0381
INFO:tensorflow:loss = 1.2501904, step = 92520 (7.668 sec)
INFO:tensorflow:lr = 0.00015784417 (7.668 sec)
INFO:tensorflow:global_step/sec: 12.812
INFO:tensorflow:loss = 1.2477765, step = 92620 (7.809 sec)
INFO:tensorflow:lr = 0.00015768562 (7.810 sec)
INFO:tensorflow:global_step/sec: 12.697
INFO:tensorflow:loss = 1.2476797, step = 92720 (7.873 sec)
INFO:tensorflow:lr = 0.0001575272 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.7559
INFO:tensorflow:loss = 1.2522918, step = 92820 (7.838 sec)
INFO:tensorflow:lr = 0.00015736897 (7.837 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.66571
INFO:tensorflow:loss = 1.2524945, step = 92920 (11.542 sec)
INFO:tensorflow:lr = 0.00015721089 (11.544 sec)
INFO:tensorflow:global_step/sec: 12.7391
INFO:tensorflow:loss = 1.2476618, step = 93020 (7.850 sec)
INFO:tensorflow:lr = 0.00015705297 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.8889
INFO:tensorflow:loss = 1.2466986, step = 93120 (7.763 sec)
INFO:tensorflow:lr = 0.0001568952 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.5188
INFO:tensorflow:loss = 1.2498853, step = 93220 (7.981 sec)
INFO:tensorflow:lr = 0.0001567376 (7.981 sec)
INFO:tensorflow:global_step/sec: 12.814
INFO:tensorflow:loss = 1.2529539, step = 93320 (7.804 sec)
INFO:tensorflow:lr = 0.00015658015 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.4364
INFO:tensorflow:loss = 1.251761, step = 93420 (8.041 sec)
INFO:tensorflow:lr = 0.00015642284 (8.041 sec)
INFO:tensorflow:global_step/sec: 12.9053
INFO:tensorflow:loss = 1.2578083, step = 93520 (7.749 sec)
INFO:tensorflow:lr = 0.00015626573 (7.751 sec)
INFO:tensorflow:global_step/sec: 13.0071
INFO:tensorflow:loss = 1.2468418, step = 93620 (7.687 sec)
INFO:tensorflow:lr = 0.00015610874 (7.686 sec)
INFO:tensorflow:global_step/sec: 12.4707
INFO:tensorflow:loss = 1.2501042, step = 93720 (8.023 sec)
INFO:tensorflow:lr = 0.00015595194 (8.026 sec)
INFO:tensorflow:global_step/sec: 12.5457
INFO:tensorflow:loss = 1.2522388, step = 93820 (7.966 sec)
INFO:tensorflow:lr = 0.00015579528 (7.968 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.2347
INFO:tensorflow:loss = 1.2465913, step = 93920 (10.833 sec)
INFO:tensorflow:lr = 0.00015563879 (10.830 sec)
INFO:tensorflow:global_step/sec: 12.9867
INFO:tensorflow:loss = 1.2459806, step = 94020 (7.702 sec)
INFO:tensorflow:lr = 0.00015548244 (7.702 sec)
INFO:tensorflow:global_step/sec: 12.8375
INFO:tensorflow:loss = 1.2477661, step = 94120 (7.789 sec)
INFO:tensorflow:lr = 0.00015532626 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.7264
INFO:tensorflow:loss = 1.2550383, step = 94220 (7.857 sec)
INFO:tensorflow:lr = 0.00015517023 (7.856 sec)
INFO:tensorflow:global_step/sec: 12.756
INFO:tensorflow:loss = 1.2482506, step = 94320 (7.840 sec)
INFO:tensorflow:lr = 0.00015501435 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.5792
INFO:tensorflow:loss = 1.2513517, step = 94420 (7.949 sec)
INFO:tensorflow:lr = 0.00015485863 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.7862
INFO:tensorflow:loss = 1.2492919, step = 94520 (7.816 sec)
INFO:tensorflow:lr = 0.00015470307 (7.817 sec)
INFO:tensorflow:global_step/sec: 12.8749
INFO:tensorflow:loss = 1.2463424, step = 94620 (7.773 sec)
INFO:tensorflow:lr = 0.00015454767 (7.771 sec)
INFO:tensorflow:global_step/sec: 12.5792
INFO:tensorflow:loss = 1.245236, step = 94720 (7.944 sec)
INFO:tensorflow:lr = 0.00015439242 (7.944 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.961
INFO:tensorflow:loss = 1.2500908, step = 94820 (8.375 sec)
INFO:tensorflow:lr = 0.00015423732 (8.375 sec)
INFO:tensorflow:global_step/sec: 10.729
INFO:tensorflow:loss = 1.2478384, step = 94920 (9.307 sec)
INFO:tensorflow:lr = 0.00015408237 (9.309 sec)
INFO:tensorflow:global_step/sec: 12.6397
INFO:tensorflow:loss = 1.248349, step = 95020 (7.911 sec)
INFO:tensorflow:lr = 0.00015392763 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.7204
INFO:tensorflow:loss = 1.2496285, step = 95120 (7.862 sec)
INFO:tensorflow:lr = 0.000153773 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.7468
INFO:tensorflow:loss = 1.2597445, step = 95220 (7.848 sec)
INFO:tensorflow:lr = 0.00015361853 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.5758
INFO:tensorflow:loss = 1.2453961, step = 95320 (7.952 sec)
INFO:tensorflow:lr = 0.0001534642 (7.950 sec)
INFO:tensorflow:global_step/sec: 12.732
INFO:tensorflow:loss = 1.2543547, step = 95420 (7.852 sec)
INFO:tensorflow:lr = 0.00015331004 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.5471
INFO:tensorflow:loss = 1.2571616, step = 95520 (7.971 sec)
INFO:tensorflow:lr = 0.00015315604 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.8873
INFO:tensorflow:loss = 1.2492933, step = 95620 (7.761 sec)
INFO:tensorflow:lr = 0.0001530022 (7.759 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.9774
INFO:tensorflow:loss = 1.2539256, step = 95720 (7.708 sec)
INFO:tensorflow:lr = 0.0001528485 (7.709 sec)
INFO:tensorflow:global_step/sec: 10.8335
INFO:tensorflow:loss = 1.2586083, step = 95820 (9.226 sec)
INFO:tensorflow:lr = 0.00015269495 (9.226 sec)
INFO:tensorflow:global_step/sec: 12.9627
INFO:tensorflow:loss = 1.2478311, step = 95920 (7.717 sec)
INFO:tensorflow:lr = 0.00015254157 (7.716 sec)
INFO:tensorflow:global_step/sec: 12.7404
INFO:tensorflow:loss = 1.246582, step = 96020 (7.847 sec)
INFO:tensorflow:lr = 0.00015238834 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.8753
INFO:tensorflow:loss = 1.2462858, step = 96120 (7.763 sec)
INFO:tensorflow:lr = 0.00015223527 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.7781
INFO:tensorflow:loss = 1.248619, step = 96220 (7.827 sec)
INFO:tensorflow:lr = 0.00015208234 (7.826 sec)
INFO:tensorflow:global_step/sec: 12.8999
INFO:tensorflow:loss = 1.2437112, step = 96320 (7.751 sec)
INFO:tensorflow:lr = 0.00015192956 (7.751 sec)
INFO:tensorflow:global_step/sec: 12.9556
INFO:tensorflow:loss = 1.2472332, step = 96420 (7.724 sec)
INFO:tensorflow:lr = 0.00015177694 (7.724 sec)
INFO:tensorflow:global_step/sec: 12.5363
INFO:tensorflow:loss = 1.2497894, step = 96520 (7.972 sec)
INFO:tensorflow:lr = 0.00015162448 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.7175
INFO:tensorflow:loss = 1.2479632, step = 96620 (7.868 sec)
INFO:tensorflow:lr = 0.00015147217 (7.867 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.8365
INFO:tensorflow:loss = 1.2539418, step = 96720 (8.445 sec)
INFO:tensorflow:lr = 0.00015132003 (8.448 sec)
INFO:tensorflow:global_step/sec: 11.3935
INFO:tensorflow:loss = 1.246201, step = 96820 (8.780 sec)
INFO:tensorflow:lr = 0.000151168 (8.777 sec)
INFO:tensorflow:global_step/sec: 12.8646
INFO:tensorflow:loss = 1.2464495, step = 96920 (7.773 sec)
INFO:tensorflow:lr = 0.00015101615 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.8559
INFO:tensorflow:loss = 1.2489393, step = 97020 (7.776 sec)
INFO:tensorflow:lr = 0.00015086446 (7.777 sec)
INFO:tensorflow:global_step/sec: 12.755
INFO:tensorflow:loss = 1.2475141, step = 97120 (7.844 sec)
INFO:tensorflow:lr = 0.00015071292 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.469
INFO:tensorflow:loss = 1.2522881, step = 97220 (8.019 sec)
INFO:tensorflow:lr = 0.00015056152 (8.019 sec)
INFO:tensorflow:global_step/sec: 12.8521
INFO:tensorflow:loss = 1.2474856, step = 97320 (7.775 sec)
INFO:tensorflow:lr = 0.00015041027 (7.777 sec)
INFO:tensorflow:global_step/sec: 13.0048
INFO:tensorflow:loss = 1.2518626, step = 97420 (7.691 sec)
INFO:tensorflow:lr = 0.00015025918 (7.692 sec)
INFO:tensorflow:global_step/sec: 12.8331
INFO:tensorflow:loss = 1.2469357, step = 97520 (7.797 sec)
INFO:tensorflow:lr = 0.00015010824 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.8551
INFO:tensorflow:loss = 1.2467525, step = 97620 (7.774 sec)
INFO:tensorflow:lr = 0.00014995746 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.8103
INFO:tensorflow:loss = 1.2500345, step = 97720 (7.811 sec)
INFO:tensorflow:lr = 0.00014980682 (7.811 sec)
INFO:tensorflow:Saving checkpoints for 97800 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2452809.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-97800
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-97800
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.721
INFO:tensorflow:Best (Exact Match) Accuracy: 0.721
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-97800
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 97800 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2478939, step = 97800
INFO:tensorflow:lr = 0.00014968641
INFO:tensorflow:global_step/sec: 10.2999
INFO:tensorflow:loss = 1.2530776, step = 97900 (9.710 sec)
INFO:tensorflow:lr = 0.00014953606 (9.710 sec)
INFO:tensorflow:global_step/sec: 12.5138
INFO:tensorflow:loss = 1.2495674, step = 98000 (7.999 sec)
INFO:tensorflow:lr = 0.00014938583 (7.998 sec)
INFO:tensorflow:global_step/sec: 12.6598
INFO:tensorflow:loss = 1.2456689, step = 98100 (7.892 sec)
INFO:tensorflow:lr = 0.00014923578 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.7983
INFO:tensorflow:loss = 1.2530382, step = 98200 (7.815 sec)
INFO:tensorflow:lr = 0.00014908587 (7.814 sec)
INFO:tensorflow:global_step/sec: 12.7198
INFO:tensorflow:loss = 1.2474073, step = 98300 (7.867 sec)
INFO:tensorflow:lr = 0.00014893612 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.7548
INFO:tensorflow:loss = 1.2511063, step = 98400 (7.839 sec)
INFO:tensorflow:lr = 0.00014878651 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.6978
INFO:tensorflow:loss = 1.2448481, step = 98500 (7.877 sec)
INFO:tensorflow:lr = 0.00014863703 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.9897
INFO:tensorflow:loss = 1.2509502, step = 98600 (7.692 sec)
INFO:tensorflow:lr = 0.00014848771 (7.690 sec)
INFO:tensorflow:global_step/sec: 12.8457
INFO:tensorflow:loss = 1.2510892, step = 98700 (7.785 sec)
INFO:tensorflow:lr = 0.00014833857 (7.785 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35826
INFO:tensorflow:loss = 1.2454256, step = 98800 (11.964 sec)
INFO:tensorflow:lr = 0.00014818956 (11.964 sec)
INFO:tensorflow:global_step/sec: 12.6956
INFO:tensorflow:loss = 1.2526236, step = 98900 (7.882 sec)
INFO:tensorflow:lr = 0.0001480407 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.6931
INFO:tensorflow:loss = 1.2457856, step = 99000 (7.879 sec)
INFO:tensorflow:lr = 0.00014789199 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.7124
INFO:tensorflow:loss = 1.2481877, step = 99100 (7.865 sec)
INFO:tensorflow:lr = 0.00014774341 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.9415
INFO:tensorflow:loss = 1.2529738, step = 99200 (7.725 sec)
INFO:tensorflow:lr = 0.00014759501 (7.728 sec)
INFO:tensorflow:global_step/sec: 12.51
INFO:tensorflow:loss = 1.2549247, step = 99300 (7.996 sec)
INFO:tensorflow:lr = 0.00014744674 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.8669
INFO:tensorflow:loss = 1.2506918, step = 99400 (7.773 sec)
INFO:tensorflow:lr = 0.00014729865 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.9446
INFO:tensorflow:loss = 1.251098, step = 99500 (7.724 sec)
INFO:tensorflow:lr = 0.00014715067 (7.724 sec)
INFO:tensorflow:global_step/sec: 12.9673
INFO:tensorflow:loss = 1.2509713, step = 99600 (7.708 sec)
INFO:tensorflow:lr = 0.00014700285 (7.713 sec)
INFO:tensorflow:global_step/sec: 12.8537
INFO:tensorflow:loss = 1.2475537, step = 99700 (7.779 sec)
INFO:tensorflow:lr = 0.0001468552 (7.774 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.30087
INFO:tensorflow:loss = 1.249899, step = 99800 (12.051 sec)
INFO:tensorflow:lr = 0.00014670768 (12.050 sec)
INFO:tensorflow:global_step/sec: 12.6009
INFO:tensorflow:loss = 1.2500576, step = 99900 (7.939 sec)
INFO:tensorflow:lr = 0.00014656028 (7.939 sec)
INFO:tensorflow:global_step/sec: 12.6469
INFO:tensorflow:loss = 1.2471527, step = 100000 (7.902 sec)
INFO:tensorflow:lr = 0.00014641306 (7.905 sec)
INFO:tensorflow:global_step/sec: 12.8393
INFO:tensorflow:loss = 1.2491647, step = 100100 (7.791 sec)
INFO:tensorflow:lr = 0.00014626599 (7.788 sec)
INFO:tensorflow:global_step/sec: 12.4661
INFO:tensorflow:loss = 1.2583389, step = 100200 (8.018 sec)
INFO:tensorflow:lr = 0.00014611905 (8.018 sec)
INFO:tensorflow:global_step/sec: 12.7297
INFO:tensorflow:loss = 1.2637594, step = 100300 (7.856 sec)
INFO:tensorflow:lr = 0.00014597227 (7.856 sec)
INFO:tensorflow:global_step/sec: 13.0237
INFO:tensorflow:loss = 1.2442552, step = 100400 (7.679 sec)
INFO:tensorflow:lr = 0.00014582566 (7.679 sec)
INFO:tensorflow:global_step/sec: 13.0379
INFO:tensorflow:loss = 1.2445681, step = 100500 (7.670 sec)
INFO:tensorflow:lr = 0.00014567917 (7.671 sec)
INFO:tensorflow:global_step/sec: 12.9349
INFO:tensorflow:loss = 1.2465498, step = 100600 (7.731 sec)
INFO:tensorflow:lr = 0.00014553282 (7.730 sec)
INFO:tensorflow:global_step/sec: 12.8189
INFO:tensorflow:loss = 1.250596, step = 100700 (7.803 sec)
INFO:tensorflow:lr = 0.00014538663 (7.803 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.28172
INFO:tensorflow:loss = 1.2455262, step = 100800 (12.075 sec)
INFO:tensorflow:lr = 0.0001452406 (12.075 sec)
INFO:tensorflow:global_step/sec: 12.9382
INFO:tensorflow:loss = 1.2536768, step = 100900 (7.732 sec)
INFO:tensorflow:lr = 0.0001450947 (7.732 sec)
INFO:tensorflow:global_step/sec: 12.7612
INFO:tensorflow:loss = 1.2488126, step = 101000 (7.836 sec)
INFO:tensorflow:lr = 0.00014494894 (7.835 sec)
INFO:tensorflow:global_step/sec: 12.9549
INFO:tensorflow:loss = 1.2458501, step = 101100 (7.714 sec)
INFO:tensorflow:lr = 0.00014480333 (7.716 sec)
INFO:tensorflow:global_step/sec: 12.6402
INFO:tensorflow:loss = 1.2484591, step = 101200 (7.912 sec)
INFO:tensorflow:lr = 0.00014465788 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.4116
INFO:tensorflow:loss = 1.2440362, step = 101300 (8.059 sec)
INFO:tensorflow:lr = 0.00014451255 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.6824
INFO:tensorflow:loss = 1.2500799, step = 101400 (7.882 sec)
INFO:tensorflow:lr = 0.00014436738 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.6559
INFO:tensorflow:loss = 1.2466154, step = 101500 (7.901 sec)
INFO:tensorflow:lr = 0.00014422236 (7.900 sec)
INFO:tensorflow:global_step/sec: 13.0559
INFO:tensorflow:loss = 1.2482994, step = 101600 (7.660 sec)
INFO:tensorflow:lr = 0.0001440775 (7.660 sec)
INFO:tensorflow:global_step/sec: 12.8514
INFO:tensorflow:loss = 1.2523829, step = 101700 (7.785 sec)
INFO:tensorflow:lr = 0.00014393278 (7.784 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.45087
INFO:tensorflow:loss = 1.2452083, step = 101800 (11.835 sec)
INFO:tensorflow:lr = 0.00014378819 (11.835 sec)
INFO:tensorflow:global_step/sec: 12.569
INFO:tensorflow:loss = 1.2493188, step = 101900 (7.951 sec)
INFO:tensorflow:lr = 0.00014364375 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.8148
INFO:tensorflow:loss = 1.2473443, step = 102000 (7.804 sec)
INFO:tensorflow:lr = 0.00014349945 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.4523
INFO:tensorflow:loss = 1.2531881, step = 102100 (8.030 sec)
INFO:tensorflow:lr = 0.00014335531 (8.030 sec)
INFO:tensorflow:global_step/sec: 12.6382
INFO:tensorflow:loss = 1.2482383, step = 102200 (7.913 sec)
INFO:tensorflow:lr = 0.0001432113 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.8723
INFO:tensorflow:loss = 1.2539681, step = 102300 (7.768 sec)
INFO:tensorflow:lr = 0.00014306743 (7.771 sec)
INFO:tensorflow:global_step/sec: 12.9976
INFO:tensorflow:loss = 1.2506423, step = 102400 (7.699 sec)
INFO:tensorflow:lr = 0.00014292373 (7.697 sec)
INFO:tensorflow:global_step/sec: 12.6729
INFO:tensorflow:loss = 1.2471061, step = 102500 (7.890 sec)
INFO:tensorflow:lr = 0.00014278015 (7.889 sec)
INFO:tensorflow:global_step/sec: 13.0785
INFO:tensorflow:loss = 1.253192, step = 102600 (7.642 sec)
INFO:tensorflow:lr = 0.00014263671 (7.642 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.65168
INFO:tensorflow:loss = 1.2455392, step = 102700 (11.565 sec)
INFO:tensorflow:lr = 0.00014249345 (11.565 sec)
INFO:tensorflow:global_step/sec: 12.6778
INFO:tensorflow:loss = 1.2455585, step = 102800 (7.882 sec)
INFO:tensorflow:lr = 0.0001423503 (7.882 sec)
INFO:tensorflow:global_step/sec: 12.9287
INFO:tensorflow:loss = 1.2474979, step = 102900 (7.735 sec)
INFO:tensorflow:lr = 0.00014220731 (7.736 sec)
INFO:tensorflow:global_step/sec: 12.5712
INFO:tensorflow:loss = 1.2525347, step = 103000 (7.958 sec)
INFO:tensorflow:lr = 0.00014206445 (7.957 sec)
INFO:tensorflow:global_step/sec: 12.7429
INFO:tensorflow:loss = 1.2527738, step = 103100 (7.848 sec)
INFO:tensorflow:lr = 0.00014192174 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.8437
INFO:tensorflow:loss = 1.2513976, step = 103200 (7.782 sec)
INFO:tensorflow:lr = 0.00014177918 (7.782 sec)
INFO:tensorflow:global_step/sec: 13.1909
INFO:tensorflow:loss = 1.2616798, step = 103300 (7.585 sec)
INFO:tensorflow:lr = 0.00014163676 (7.585 sec)
INFO:tensorflow:global_step/sec: 12.7898
INFO:tensorflow:loss = 1.2459317, step = 103400 (7.819 sec)
INFO:tensorflow:lr = 0.00014149447 (7.817 sec)
INFO:tensorflow:global_step/sec: 12.7356
INFO:tensorflow:loss = 1.2490375, step = 103500 (7.847 sec)
INFO:tensorflow:lr = 0.00014135234 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.6504
INFO:tensorflow:loss = 1.2508307, step = 103600 (7.908 sec)
INFO:tensorflow:lr = 0.00014121036 (7.907 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.35231
INFO:tensorflow:loss = 1.2476784, step = 103700 (10.694 sec)
INFO:tensorflow:lr = 0.00014106852 (10.697 sec)
INFO:tensorflow:global_step/sec: 12.7486
INFO:tensorflow:loss = 1.2524669, step = 103800 (7.845 sec)
INFO:tensorflow:lr = 0.0001409268 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.73
INFO:tensorflow:loss = 1.247279, step = 103900 (7.855 sec)
INFO:tensorflow:lr = 0.00014078524 (7.856 sec)
INFO:tensorflow:global_step/sec: 12.6726
INFO:tensorflow:loss = 1.2515517, step = 104000 (7.890 sec)
INFO:tensorflow:lr = 0.00014064382 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.5949
INFO:tensorflow:loss = 1.243661, step = 104100 (7.935 sec)
INFO:tensorflow:lr = 0.00014050253 (7.935 sec)
INFO:tensorflow:global_step/sec: 12.8437
INFO:tensorflow:loss = 1.2481575, step = 104200 (7.786 sec)
INFO:tensorflow:lr = 0.00014036139 (7.786 sec)
INFO:tensorflow:global_step/sec: 12.7226
INFO:tensorflow:loss = 1.2454779, step = 104300 (7.866 sec)
INFO:tensorflow:lr = 0.00014022039 (7.866 sec)
INFO:tensorflow:global_step/sec: 13.1483
INFO:tensorflow:loss = 1.2469022, step = 104400 (7.601 sec)
INFO:tensorflow:lr = 0.00014007956 (7.603 sec)
INFO:tensorflow:global_step/sec: 12.7578
INFO:tensorflow:loss = 1.2458844, step = 104500 (7.843 sec)
INFO:tensorflow:lr = 0.00013993881 (7.841 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0438
INFO:tensorflow:loss = 1.2457703, step = 104600 (8.302 sec)
INFO:tensorflow:lr = 0.00013979826 (8.302 sec)
INFO:tensorflow:global_step/sec: 10.6714
INFO:tensorflow:loss = 1.2621123, step = 104700 (9.368 sec)
INFO:tensorflow:lr = 0.0001396578 (9.369 sec)
INFO:tensorflow:global_step/sec: 12.7622
INFO:tensorflow:loss = 1.252069, step = 104800 (7.839 sec)
INFO:tensorflow:lr = 0.00013951753 (7.838 sec)
INFO:tensorflow:global_step/sec: 12.8765
INFO:tensorflow:loss = 1.2471956, step = 104900 (7.769 sec)
INFO:tensorflow:lr = 0.00013937739 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.6423
INFO:tensorflow:loss = 1.2450892, step = 105000 (7.908 sec)
INFO:tensorflow:lr = 0.00013923737 (7.909 sec)
INFO:tensorflow:global_step/sec: 12.8286
INFO:tensorflow:loss = 1.2544929, step = 105100 (7.793 sec)
INFO:tensorflow:lr = 0.0001390975 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.5893
INFO:tensorflow:loss = 1.247633, step = 105200 (7.940 sec)
INFO:tensorflow:lr = 0.00013895777 (7.939 sec)
INFO:tensorflow:global_step/sec: 13.1147
INFO:tensorflow:loss = 1.2575452, step = 105300 (7.630 sec)
INFO:tensorflow:lr = 0.00013881818 (7.630 sec)
INFO:tensorflow:global_step/sec: 12.8288
INFO:tensorflow:loss = 1.2458938, step = 105400 (7.789 sec)
INFO:tensorflow:lr = 0.00013867875 (7.792 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.4148
INFO:tensorflow:loss = 1.2475997, step = 105500 (8.062 sec)
INFO:tensorflow:lr = 0.00013853943 (8.060 sec)
INFO:tensorflow:global_step/sec: 11.1919
INFO:tensorflow:loss = 1.2466756, step = 105600 (8.932 sec)
INFO:tensorflow:lr = 0.00013840027 (8.931 sec)
INFO:tensorflow:global_step/sec: 13.0127
INFO:tensorflow:loss = 1.2510452, step = 105700 (7.686 sec)
INFO:tensorflow:lr = 0.00013826125 (7.686 sec)
INFO:tensorflow:global_step/sec: 12.7357
INFO:tensorflow:loss = 1.2437646, step = 105800 (7.850 sec)
INFO:tensorflow:lr = 0.00013812236 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.5414
INFO:tensorflow:loss = 1.2473345, step = 105900 (7.970 sec)
INFO:tensorflow:lr = 0.0001379836 (7.972 sec)
INFO:tensorflow:global_step/sec: 13.1739
INFO:tensorflow:loss = 1.2456942, step = 106000 (7.591 sec)
INFO:tensorflow:lr = 0.000137845 (7.591 sec)
INFO:tensorflow:global_step/sec: 12.8703
INFO:tensorflow:loss = 1.2483459, step = 106100 (7.776 sec)
INFO:tensorflow:lr = 0.00013770652 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.7021
INFO:tensorflow:loss = 1.24482, step = 106200 (7.872 sec)
INFO:tensorflow:lr = 0.00013756819 (7.872 sec)
INFO:tensorflow:global_step/sec: 12.8143
INFO:tensorflow:loss = 1.2478292, step = 106300 (7.801 sec)
INFO:tensorflow:lr = 0.00013743 (7.802 sec)
INFO:tensorflow:global_step/sec: 12.9085
INFO:tensorflow:loss = 1.2532618, step = 106400 (7.749 sec)
INFO:tensorflow:lr = 0.00013729198 (7.749 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.9567
INFO:tensorflow:loss = 1.2503626, step = 106500 (8.363 sec)
INFO:tensorflow:lr = 0.00013715404 (8.363 sec)
INFO:tensorflow:global_step/sec: 11.4986
INFO:tensorflow:loss = 1.2475023, step = 106600 (8.699 sec)
INFO:tensorflow:lr = 0.00013701625 (8.699 sec)
INFO:tensorflow:global_step/sec: 12.6916
INFO:tensorflow:loss = 1.246882, step = 106700 (7.875 sec)
INFO:tensorflow:lr = 0.00013687865 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.9143
INFO:tensorflow:loss = 1.2436101, step = 106800 (7.745 sec)
INFO:tensorflow:lr = 0.00013674115 (7.744 sec)
INFO:tensorflow:global_step/sec: 12.8539
INFO:tensorflow:loss = 1.2468636, step = 106900 (7.779 sec)
INFO:tensorflow:lr = 0.00013660378 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.7943
INFO:tensorflow:loss = 1.2541093, step = 107000 (7.816 sec)
INFO:tensorflow:lr = 0.00013646655 (7.816 sec)
INFO:tensorflow:global_step/sec: 12.9027
INFO:tensorflow:loss = 1.2474351, step = 107100 (7.750 sec)
INFO:tensorflow:lr = 0.00013632947 (7.750 sec)
INFO:tensorflow:global_step/sec: 13.1961
INFO:tensorflow:loss = 1.2451929, step = 107200 (7.574 sec)
INFO:tensorflow:lr = 0.00013619252 (7.578 sec)
INFO:tensorflow:global_step/sec: 12.5269
INFO:tensorflow:loss = 1.2497258, step = 107300 (7.987 sec)
INFO:tensorflow:lr = 0.00013605572 (7.982 sec)
INFO:tensorflow:global_step/sec: 12.5849
INFO:tensorflow:loss = 1.2448314, step = 107400 (7.946 sec)
INFO:tensorflow:lr = 0.00013591905 (7.946 sec)
INFO:tensorflow:global_step/sec: 12.951
INFO:tensorflow:loss = 1.2444179, step = 107500 (7.717 sec)
INFO:tensorflow:lr = 0.00013578251 (7.719 sec)
INFO:tensorflow:Saving checkpoints for 107580 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2442379.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-107580
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-107580
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.723
INFO:tensorflow:Best (Exact Match) Accuracy: 0.723
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-107580
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 107580 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2489259, step = 107580
INFO:tensorflow:lr = 0.00013567338
INFO:tensorflow:global_step/sec: 10.4098
INFO:tensorflow:loss = 1.2465535, step = 107680 (9.612 sec)
INFO:tensorflow:lr = 0.00013553708 (9.612 sec)
INFO:tensorflow:global_step/sec: 12.4733
INFO:tensorflow:loss = 1.249318, step = 107780 (8.013 sec)
INFO:tensorflow:lr = 0.00013540093 (8.012 sec)
INFO:tensorflow:global_step/sec: 12.822
INFO:tensorflow:loss = 1.2475603, step = 107880 (7.800 sec)
INFO:tensorflow:lr = 0.00013526493 (7.802 sec)
INFO:tensorflow:global_step/sec: 13.0186
INFO:tensorflow:loss = 1.2548482, step = 107980 (7.688 sec)
INFO:tensorflow:lr = 0.00013512906 (7.691 sec)
INFO:tensorflow:global_step/sec: 12.6619
INFO:tensorflow:loss = 1.247991, step = 108080 (7.895 sec)
INFO:tensorflow:lr = 0.00013499332 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.4877
INFO:tensorflow:loss = 1.2462689, step = 108180 (8.008 sec)
INFO:tensorflow:lr = 0.00013485769 (8.006 sec)
INFO:tensorflow:global_step/sec: 12.7378
INFO:tensorflow:loss = 1.2458864, step = 108280 (7.845 sec)
INFO:tensorflow:lr = 0.00013472223 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.869
INFO:tensorflow:loss = 1.2465334, step = 108380 (7.783 sec)
INFO:tensorflow:lr = 0.00013458691 (7.784 sec)
INFO:tensorflow:global_step/sec: 12.3673
INFO:tensorflow:loss = 1.2464366, step = 108480 (8.074 sec)
INFO:tensorflow:lr = 0.00013445171 (8.075 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.4047
INFO:tensorflow:loss = 1.2486157, step = 108580 (11.904 sec)
INFO:tensorflow:lr = 0.00013431665 (11.903 sec)
INFO:tensorflow:global_step/sec: 12.9262
INFO:tensorflow:loss = 1.2478218, step = 108680 (7.734 sec)
INFO:tensorflow:lr = 0.00013418171 (7.733 sec)
INFO:tensorflow:global_step/sec: 12.7297
INFO:tensorflow:loss = 1.2497544, step = 108780 (7.853 sec)
INFO:tensorflow:lr = 0.00013404692 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.6782
INFO:tensorflow:loss = 1.2516304, step = 108880 (7.887 sec)
INFO:tensorflow:lr = 0.00013391227 (7.885 sec)
INFO:tensorflow:global_step/sec: 12.8279
INFO:tensorflow:loss = 1.2466173, step = 108980 (7.797 sec)
INFO:tensorflow:lr = 0.00013377776 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.6044
INFO:tensorflow:loss = 1.2438627, step = 109080 (7.936 sec)
INFO:tensorflow:lr = 0.00013364338 (7.937 sec)
INFO:tensorflow:global_step/sec: 12.5006
INFO:tensorflow:loss = 1.2459699, step = 109180 (7.995 sec)
INFO:tensorflow:lr = 0.00013350912 (7.999 sec)
INFO:tensorflow:global_step/sec: 12.3132
INFO:tensorflow:loss = 1.2494336, step = 109280 (8.128 sec)
INFO:tensorflow:lr = 0.00013337501 (8.123 sec)
INFO:tensorflow:global_step/sec: 12.6142
INFO:tensorflow:loss = 1.2490482, step = 109380 (7.923 sec)
INFO:tensorflow:lr = 0.00013324103 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.9434
INFO:tensorflow:loss = 1.244992, step = 109480 (7.731 sec)
INFO:tensorflow:lr = 0.00013310718 (7.727 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.42797
INFO:tensorflow:loss = 1.246099, step = 109580 (11.859 sec)
INFO:tensorflow:lr = 0.00013297348 (11.860 sec)
INFO:tensorflow:global_step/sec: 12.7311
INFO:tensorflow:loss = 1.2468445, step = 109680 (7.856 sec)
INFO:tensorflow:lr = 0.00013283991 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.4444
INFO:tensorflow:loss = 1.2453207, step = 109780 (8.036 sec)
INFO:tensorflow:lr = 0.00013270645 (8.041 sec)
INFO:tensorflow:global_step/sec: 12.396
INFO:tensorflow:loss = 1.247017, step = 109880 (8.070 sec)
INFO:tensorflow:lr = 0.00013257316 (8.066 sec)
INFO:tensorflow:global_step/sec: 12.881
INFO:tensorflow:loss = 1.2435148, step = 109980 (7.759 sec)
INFO:tensorflow:lr = 0.00013244 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.5229
INFO:tensorflow:loss = 1.2592441, step = 110080 (7.990 sec)
INFO:tensorflow:lr = 0.00013230696 (7.990 sec)
INFO:tensorflow:global_step/sec: 12.6508
INFO:tensorflow:loss = 1.2503728, step = 110180 (7.900 sec)
INFO:tensorflow:lr = 0.00013217404 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.2981
INFO:tensorflow:loss = 1.2484401, step = 110280 (8.134 sec)
INFO:tensorflow:lr = 0.00013204126 (8.134 sec)
INFO:tensorflow:global_step/sec: 12.6796
INFO:tensorflow:loss = 1.2463096, step = 110380 (7.885 sec)
INFO:tensorflow:lr = 0.00013190863 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.2949
INFO:tensorflow:loss = 1.2451106, step = 110480 (8.141 sec)
INFO:tensorflow:lr = 0.00013177612 (8.138 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.84506
INFO:tensorflow:loss = 1.2448896, step = 110580 (12.743 sec)
INFO:tensorflow:lr = 0.00013164374 (12.744 sec)
INFO:tensorflow:global_step/sec: 12.412
INFO:tensorflow:loss = 1.2469372, step = 110680 (8.057 sec)
INFO:tensorflow:lr = 0.0001315115 (8.056 sec)
INFO:tensorflow:global_step/sec: 12.3222
INFO:tensorflow:loss = 1.2455852, step = 110780 (8.112 sec)
INFO:tensorflow:lr = 0.0001313794 (8.113 sec)
INFO:tensorflow:global_step/sec: 11.929
INFO:tensorflow:loss = 1.2448218, step = 110880 (8.381 sec)
INFO:tensorflow:lr = 0.00013124742 (8.379 sec)
INFO:tensorflow:global_step/sec: 12.2422
INFO:tensorflow:loss = 1.2461655, step = 110980 (8.168 sec)
INFO:tensorflow:lr = 0.0001311156 (8.168 sec)
INFO:tensorflow:global_step/sec: 12.5866
INFO:tensorflow:loss = 1.2536453, step = 111080 (7.951 sec)
INFO:tensorflow:lr = 0.00013098388 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.4155
INFO:tensorflow:loss = 1.2434506, step = 111180 (8.055 sec)
INFO:tensorflow:lr = 0.00013085229 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.2427
INFO:tensorflow:loss = 1.2464231, step = 111280 (8.167 sec)
INFO:tensorflow:lr = 0.00013072084 (8.166 sec)
INFO:tensorflow:global_step/sec: 12.5907
INFO:tensorflow:loss = 1.2453758, step = 111380 (7.938 sec)
INFO:tensorflow:lr = 0.00013058954 (7.937 sec)
INFO:tensorflow:global_step/sec: 12.716
INFO:tensorflow:loss = 1.2442877, step = 111480 (7.864 sec)
INFO:tensorflow:lr = 0.00013045836 (7.866 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.21248
INFO:tensorflow:loss = 1.2450273, step = 111580 (12.182 sec)
INFO:tensorflow:lr = 0.00013032732 (12.177 sec)
INFO:tensorflow:global_step/sec: 12.3679
INFO:tensorflow:loss = 1.2450981, step = 111680 (8.082 sec)
INFO:tensorflow:lr = 0.0001301964 (8.086 sec)
INFO:tensorflow:global_step/sec: 12.2747
INFO:tensorflow:loss = 1.2465881, step = 111780 (8.144 sec)
INFO:tensorflow:lr = 0.0001300656 (8.141 sec)
INFO:tensorflow:global_step/sec: 12.6075
INFO:tensorflow:loss = 1.2524883, step = 111880 (7.933 sec)
INFO:tensorflow:lr = 0.00012993495 (7.933 sec)
INFO:tensorflow:global_step/sec: 12.1696
INFO:tensorflow:loss = 1.2459798, step = 111980 (8.216 sec)
INFO:tensorflow:lr = 0.00012980442 (8.217 sec)
INFO:tensorflow:global_step/sec: 12.4295
INFO:tensorflow:loss = 1.2500193, step = 112080 (8.049 sec)
INFO:tensorflow:lr = 0.00012967402 (8.049 sec)
INFO:tensorflow:global_step/sec: 12.3575
INFO:tensorflow:loss = 1.2450176, step = 112180 (8.088 sec)
INFO:tensorflow:lr = 0.00012954377 (8.088 sec)
INFO:tensorflow:global_step/sec: 12.4561
INFO:tensorflow:loss = 1.2457551, step = 112280 (8.034 sec)
INFO:tensorflow:lr = 0.00012941365 (8.034 sec)
INFO:tensorflow:global_step/sec: 12.7345
INFO:tensorflow:loss = 1.2456206, step = 112380 (7.853 sec)
INFO:tensorflow:lr = 0.00012928365 (7.853 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.4965
INFO:tensorflow:loss = 1.2451046, step = 112480 (11.770 sec)
INFO:tensorflow:lr = 0.00012915379 (11.775 sec)
INFO:tensorflow:global_step/sec: 12.5032
INFO:tensorflow:loss = 1.2449356, step = 112580 (7.997 sec)
INFO:tensorflow:lr = 0.00012902405 (7.991 sec)
INFO:tensorflow:global_step/sec: 12.4797
INFO:tensorflow:loss = 1.2540485, step = 112680 (8.008 sec)
INFO:tensorflow:lr = 0.00012889442 (8.010 sec)
INFO:tensorflow:global_step/sec: 12.4347
INFO:tensorflow:loss = 1.2504659, step = 112780 (8.048 sec)
INFO:tensorflow:lr = 0.00012876495 (8.047 sec)
INFO:tensorflow:global_step/sec: 12.3055
INFO:tensorflow:loss = 1.2495759, step = 112880 (8.123 sec)
INFO:tensorflow:lr = 0.00012863561 (8.123 sec)
INFO:tensorflow:global_step/sec: 12.5325
INFO:tensorflow:loss = 1.2485863, step = 112980 (7.979 sec)
INFO:tensorflow:lr = 0.00012850638 (7.981 sec)
INFO:tensorflow:global_step/sec: 12.3319
INFO:tensorflow:loss = 1.2465398, step = 113080 (8.107 sec)
INFO:tensorflow:lr = 0.00012837729 (8.112 sec)
INFO:tensorflow:global_step/sec: 12.3829
INFO:tensorflow:loss = 1.2465779, step = 113180 (8.076 sec)
INFO:tensorflow:lr = 0.00012824834 (8.069 sec)
INFO:tensorflow:global_step/sec: 12.6251
INFO:tensorflow:loss = 1.245736, step = 113280 (7.925 sec)
INFO:tensorflow:lr = 0.0001281195 (7.926 sec)
INFO:tensorflow:global_step/sec: 12.3343
INFO:tensorflow:loss = 1.243198, step = 113380 (8.106 sec)
INFO:tensorflow:lr = 0.0001279908 (8.109 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.77301
INFO:tensorflow:loss = 1.2464836, step = 113480 (11.396 sec)
INFO:tensorflow:lr = 0.00012786225 (11.392 sec)
INFO:tensorflow:global_step/sec: 12.4675
INFO:tensorflow:loss = 1.2475723, step = 113580 (8.026 sec)
INFO:tensorflow:lr = 0.0001277338 (8.026 sec)
INFO:tensorflow:global_step/sec: 12.5777
INFO:tensorflow:loss = 1.2461356, step = 113680 (7.945 sec)
INFO:tensorflow:lr = 0.00012760548 (7.945 sec)
INFO:tensorflow:global_step/sec: 12.383
INFO:tensorflow:loss = 1.2514325, step = 113780 (8.077 sec)
INFO:tensorflow:lr = 0.0001274773 (8.080 sec)
INFO:tensorflow:global_step/sec: 12.3492
INFO:tensorflow:loss = 1.2455924, step = 113880 (8.096 sec)
INFO:tensorflow:lr = 0.00012734925 (8.095 sec)
INFO:tensorflow:global_step/sec: 12.3347
INFO:tensorflow:loss = 1.2465392, step = 113980 (8.108 sec)
INFO:tensorflow:lr = 0.00012722133 (8.107 sec)
INFO:tensorflow:global_step/sec: 12.4384
INFO:tensorflow:loss = 1.2566938, step = 114080 (8.044 sec)
INFO:tensorflow:lr = 0.00012709353 (8.043 sec)
INFO:tensorflow:global_step/sec: 12.5175
INFO:tensorflow:loss = 1.2492527, step = 114180 (7.983 sec)
INFO:tensorflow:lr = 0.00012696585 (7.988 sec)
INFO:tensorflow:global_step/sec: 12.4114
INFO:tensorflow:loss = 1.2554555, step = 114280 (8.063 sec)
INFO:tensorflow:lr = 0.00012683832 (8.058 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.6301
INFO:tensorflow:loss = 1.248702, step = 114380 (8.610 sec)
INFO:tensorflow:lr = 0.0001267109 (8.611 sec)
INFO:tensorflow:global_step/sec: 10.0063
INFO:tensorflow:loss = 1.25149, step = 114480 (9.980 sec)
INFO:tensorflow:lr = 0.00012658362 (9.982 sec)
INFO:tensorflow:global_step/sec: 11.686
INFO:tensorflow:loss = 1.2474595, step = 114580 (8.554 sec)
INFO:tensorflow:lr = 0.00012645648 (8.552 sec)
INFO:tensorflow:global_step/sec: 12.569
INFO:tensorflow:loss = 1.2511866, step = 114680 (7.956 sec)
INFO:tensorflow:lr = 0.00012632943 (7.955 sec)
INFO:tensorflow:global_step/sec: 12.6191
INFO:tensorflow:loss = 1.2508888, step = 114780 (7.935 sec)
INFO:tensorflow:lr = 0.00012620253 (7.935 sec)
INFO:tensorflow:global_step/sec: 12.1091
INFO:tensorflow:loss = 1.2474946, step = 114880 (8.257 sec)
INFO:tensorflow:lr = 0.00012607576 (8.256 sec)
INFO:tensorflow:global_step/sec: 12.4553
INFO:tensorflow:loss = 1.2473083, step = 114980 (8.023 sec)
INFO:tensorflow:lr = 0.00012594911 (8.024 sec)
INFO:tensorflow:global_step/sec: 12.4882
INFO:tensorflow:loss = 1.2468796, step = 115080 (8.005 sec)
INFO:tensorflow:lr = 0.0001258226 (8.005 sec)
INFO:tensorflow:global_step/sec: 12.3851
INFO:tensorflow:loss = 1.2520475, step = 115180 (8.079 sec)
INFO:tensorflow:lr = 0.0001256962 (8.079 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2298
INFO:tensorflow:loss = 1.2488706, step = 115280 (8.174 sec)
INFO:tensorflow:lr = 0.00012556993 (8.177 sec)
INFO:tensorflow:global_step/sec: 10.543
INFO:tensorflow:loss = 1.2459799, step = 115380 (9.498 sec)
INFO:tensorflow:lr = 0.0001254438 (9.495 sec)
INFO:tensorflow:global_step/sec: 12.1713
INFO:tensorflow:loss = 1.2485315, step = 115480 (8.202 sec)
INFO:tensorflow:lr = 0.00012531779 (8.202 sec)
INFO:tensorflow:global_step/sec: 12.2389
INFO:tensorflow:loss = 1.2580112, step = 115580 (8.170 sec)
INFO:tensorflow:lr = 0.0001251919 (8.170 sec)
INFO:tensorflow:global_step/sec: 12.1377
INFO:tensorflow:loss = 1.2466756, step = 115680 (8.240 sec)
INFO:tensorflow:lr = 0.00012506612 (8.240 sec)
INFO:tensorflow:global_step/sec: 12.202
INFO:tensorflow:loss = 1.2510239, step = 115780 (8.194 sec)
INFO:tensorflow:lr = 0.00012494052 (8.194 sec)
INFO:tensorflow:global_step/sec: 12.4075
INFO:tensorflow:loss = 1.2495364, step = 115880 (8.066 sec)
INFO:tensorflow:lr = 0.000124815 (8.066 sec)
INFO:tensorflow:global_step/sec: 12.1013
INFO:tensorflow:loss = 1.2435124, step = 115980 (8.257 sec)
INFO:tensorflow:lr = 0.00012468963 (8.258 sec)
INFO:tensorflow:global_step/sec: 12.1832
INFO:tensorflow:loss = 1.2507396, step = 116080 (8.216 sec)
INFO:tensorflow:lr = 0.00012456437 (8.216 sec)
INFO:tensorflow:global_step/sec: 12.5537
INFO:tensorflow:loss = 1.2438142, step = 116180 (7.965 sec)
INFO:tensorflow:lr = 0.00012443922 (7.964 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.6062
INFO:tensorflow:loss = 1.2460523, step = 116280 (8.614 sec)
INFO:tensorflow:lr = 0.00012431422 (8.616 sec)
INFO:tensorflow:global_step/sec: 11.1773
INFO:tensorflow:loss = 1.2480481, step = 116380 (8.947 sec)
INFO:tensorflow:lr = 0.00012418936 (8.946 sec)
INFO:tensorflow:global_step/sec: 12.1484
INFO:tensorflow:loss = 1.2447939, step = 116480 (8.233 sec)
INFO:tensorflow:lr = 0.00012406461 (8.232 sec)
INFO:tensorflow:global_step/sec: 12.3809
INFO:tensorflow:loss = 1.2446187, step = 116580 (8.075 sec)
INFO:tensorflow:lr = 0.00012393999 (8.078 sec)
INFO:tensorflow:global_step/sec: 12.4624
INFO:tensorflow:loss = 1.2526968, step = 116680 (8.023 sec)
INFO:tensorflow:lr = 0.00012381548 (8.021 sec)
INFO:tensorflow:global_step/sec: 12.1608
INFO:tensorflow:loss = 1.2439911, step = 116780 (8.221 sec)
INFO:tensorflow:lr = 0.00012369109 (8.219 sec)
INFO:tensorflow:global_step/sec: 12.694
INFO:tensorflow:loss = 1.2494287, step = 116880 (7.878 sec)
INFO:tensorflow:lr = 0.00012356685 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.4984
INFO:tensorflow:loss = 1.2488147, step = 116980 (8.001 sec)
INFO:tensorflow:lr = 0.00012344273 (8.002 sec)
INFO:tensorflow:global_step/sec: 12.1185
INFO:tensorflow:loss = 1.2587779, step = 117080 (8.259 sec)
INFO:tensorflow:lr = 0.00012331874 (8.259 sec)
INFO:tensorflow:global_step/sec: 12.2015
INFO:tensorflow:loss = 1.2470039, step = 117180 (8.188 sec)
INFO:tensorflow:lr = 0.00012319484 (8.187 sec)
INFO:tensorflow:global_step/sec: 12.411
INFO:tensorflow:loss = 1.2492013, step = 117280 (8.059 sec)
INFO:tensorflow:lr = 0.00012307108 (8.063 sec)
INFO:tensorflow:Saving checkpoints for 117360 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2417642.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-117360
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-117360
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.722
INFO:tensorflow:Best (Exact Match) Accuracy: 0.723
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-117360
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 117360 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2482007, step = 117360
INFO:tensorflow:lr = 0.00012297218
INFO:tensorflow:global_step/sec: 9.57093
INFO:tensorflow:loss = 1.2506714, step = 117460 (10.451 sec)
INFO:tensorflow:lr = 0.00012284865 (10.446 sec)
INFO:tensorflow:global_step/sec: 12.0906
INFO:tensorflow:loss = 1.2449813, step = 117560 (8.271 sec)
INFO:tensorflow:lr = 0.00012272525 (8.270 sec)
INFO:tensorflow:global_step/sec: 12.3201
INFO:tensorflow:loss = 1.2460945, step = 117660 (8.116 sec)
INFO:tensorflow:lr = 0.00012260195 (8.116 sec)
INFO:tensorflow:global_step/sec: 12.323
INFO:tensorflow:loss = 1.2516643, step = 117760 (8.121 sec)
INFO:tensorflow:lr = 0.00012247881 (8.127 sec)
INFO:tensorflow:global_step/sec: 12.4119
INFO:tensorflow:loss = 1.2460521, step = 117860 (8.054 sec)
INFO:tensorflow:lr = 0.00012235578 (8.048 sec)
INFO:tensorflow:global_step/sec: 12.5833
INFO:tensorflow:loss = 1.2443562, step = 117960 (7.950 sec)
INFO:tensorflow:lr = 0.00012223287 (7.955 sec)
INFO:tensorflow:global_step/sec: 12.1709
INFO:tensorflow:loss = 1.246166, step = 118060 (8.216 sec)
INFO:tensorflow:lr = 0.00012211008 (8.211 sec)
INFO:tensorflow:global_step/sec: 12.5068
INFO:tensorflow:loss = 1.2477903, step = 118160 (7.995 sec)
INFO:tensorflow:lr = 0.00012198741 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.5401
INFO:tensorflow:loss = 1.2436001, step = 118260 (7.969 sec)
INFO:tensorflow:lr = 0.000121864876 (7.970 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.95747
INFO:tensorflow:loss = 1.2526491, step = 118360 (12.569 sec)
INFO:tensorflow:lr = 0.00012174245 (12.569 sec)
INFO:tensorflow:global_step/sec: 12.5398
INFO:tensorflow:loss = 1.247338, step = 118460 (7.972 sec)
INFO:tensorflow:lr = 0.00012162015 (7.972 sec)
INFO:tensorflow:global_step/sec: 12.5136
INFO:tensorflow:loss = 1.2485074, step = 118560 (7.995 sec)
INFO:tensorflow:lr = 0.000121498 (7.995 sec)
INFO:tensorflow:global_step/sec: 12.5232
INFO:tensorflow:loss = 1.2500961, step = 118660 (7.983 sec)
INFO:tensorflow:lr = 0.00012137595 (7.984 sec)
INFO:tensorflow:global_step/sec: 12.4087
INFO:tensorflow:loss = 1.2486347, step = 118760 (8.059 sec)
INFO:tensorflow:lr = 0.00012125402 (8.060 sec)
INFO:tensorflow:global_step/sec: 12.2352
INFO:tensorflow:loss = 1.2490938, step = 118860 (8.177 sec)
INFO:tensorflow:lr = 0.000121132216 (8.176 sec)
INFO:tensorflow:global_step/sec: 12.2436
INFO:tensorflow:loss = 1.25471, step = 118960 (8.168 sec)
INFO:tensorflow:lr = 0.00012101054 (8.170 sec)
INFO:tensorflow:global_step/sec: 12.4951
INFO:tensorflow:loss = 1.2441717, step = 119060 (7.996 sec)
INFO:tensorflow:lr = 0.000120888995 (7.996 sec)
INFO:tensorflow:global_step/sec: 12.6037
INFO:tensorflow:loss = 1.2489609, step = 119160 (7.934 sec)
INFO:tensorflow:lr = 0.000120767545 (7.933 sec)
INFO:tensorflow:global_step/sec: 12.475
INFO:tensorflow:loss = 1.2471738, step = 119260 (8.016 sec)
INFO:tensorflow:lr = 0.000120646226 (8.017 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.94323
INFO:tensorflow:loss = 1.2460295, step = 119360 (12.589 sec)
INFO:tensorflow:lr = 0.00012052504 (12.587 sec)
INFO:tensorflow:global_step/sec: 12.5354
INFO:tensorflow:loss = 1.2540466, step = 119460 (7.980 sec)
INFO:tensorflow:lr = 0.00012040395 (7.982 sec)
INFO:tensorflow:global_step/sec: 12.617
INFO:tensorflow:loss = 1.2463863, step = 119560 (7.925 sec)
INFO:tensorflow:lr = 0.00012028302 (7.923 sec)
INFO:tensorflow:global_step/sec: 12.2514
INFO:tensorflow:loss = 1.2426605, step = 119660 (8.162 sec)
INFO:tensorflow:lr = 0.0001201622 (8.167 sec)
INFO:tensorflow:global_step/sec: 12.4442
INFO:tensorflow:loss = 1.2469814, step = 119760 (8.039 sec)
INFO:tensorflow:lr = 0.000120041484 (8.034 sec)
INFO:tensorflow:global_step/sec: 12.5949
INFO:tensorflow:loss = 1.2479645, step = 119860 (7.940 sec)
INFO:tensorflow:lr = 0.00011992089 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.3139
INFO:tensorflow:loss = 1.2518939, step = 119960 (8.116 sec)
INFO:tensorflow:lr = 0.00011980043 (8.117 sec)
INFO:tensorflow:global_step/sec: 12.3963
INFO:tensorflow:loss = 1.2455319, step = 120060 (8.067 sec)
INFO:tensorflow:lr = 0.000119680095 (8.066 sec)
INFO:tensorflow:global_step/sec: 12.3853
INFO:tensorflow:loss = 1.2456839, step = 120160 (8.075 sec)
INFO:tensorflow:lr = 0.00011955988 (8.075 sec)
INFO:tensorflow:global_step/sec: 12.1621
INFO:tensorflow:loss = 1.2468312, step = 120260 (8.227 sec)
INFO:tensorflow:lr = 0.00011943976 (8.226 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.16586
INFO:tensorflow:loss = 1.2442948, step = 120360 (12.246 sec)
INFO:tensorflow:lr = 0.0001193198 (12.246 sec)
INFO:tensorflow:global_step/sec: 12.5876
INFO:tensorflow:loss = 1.2436161, step = 120460 (7.939 sec)
INFO:tensorflow:lr = 0.00011919992 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.3838
INFO:tensorflow:loss = 1.2517046, step = 120560 (8.075 sec)
INFO:tensorflow:lr = 0.000119080185 (8.075 sec)
INFO:tensorflow:global_step/sec: 12.4207
INFO:tensorflow:loss = 1.2490052, step = 120660 (8.051 sec)
INFO:tensorflow:lr = 0.00011896058 (8.055 sec)
INFO:tensorflow:global_step/sec: 12.6772
INFO:tensorflow:loss = 1.2606004, step = 120760 (7.894 sec)
INFO:tensorflow:lr = 0.00011884108 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.4873
INFO:tensorflow:loss = 1.2480586, step = 120860 (8.002 sec)
INFO:tensorflow:lr = 0.0001187217 (8.008 sec)
INFO:tensorflow:global_step/sec: 12.4646
INFO:tensorflow:loss = 1.2461877, step = 120960 (8.022 sec)
INFO:tensorflow:lr = 0.00011860243 (8.019 sec)
INFO:tensorflow:global_step/sec: 12.6909
INFO:tensorflow:loss = 1.2459522, step = 121060 (7.885 sec)
INFO:tensorflow:lr = 0.00011848329 (7.882 sec)
INFO:tensorflow:global_step/sec: 12.7884
INFO:tensorflow:loss = 1.2450316, step = 121160 (7.819 sec)
INFO:tensorflow:lr = 0.000118364274 (7.820 sec)
INFO:tensorflow:global_step/sec: 12.5167
INFO:tensorflow:loss = 1.2498332, step = 121260 (7.989 sec)
INFO:tensorflow:lr = 0.00011824537 (7.990 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.42824
INFO:tensorflow:loss = 1.2524766, step = 121360 (11.862 sec)
INFO:tensorflow:lr = 0.00011812659 (11.861 sec)
INFO:tensorflow:global_step/sec: 12.8493
INFO:tensorflow:loss = 1.2486544, step = 121460 (7.781 sec)
INFO:tensorflow:lr = 0.000118007934 (7.782 sec)
INFO:tensorflow:global_step/sec: 12.5805
INFO:tensorflow:loss = 1.2440406, step = 121560 (7.949 sec)
INFO:tensorflow:lr = 0.00011788939 (7.954 sec)
INFO:tensorflow:global_step/sec: 12.2106
INFO:tensorflow:loss = 1.24541, step = 121660 (8.191 sec)
INFO:tensorflow:lr = 0.000117770964 (8.185 sec)
INFO:tensorflow:global_step/sec: 12.734
INFO:tensorflow:loss = 1.244577, step = 121760 (7.858 sec)
INFO:tensorflow:lr = 0.00011765268 (7.857 sec)
INFO:tensorflow:global_step/sec: 12.524
INFO:tensorflow:loss = 1.247097, step = 121860 (7.980 sec)
INFO:tensorflow:lr = 0.000117534466 (7.985 sec)
INFO:tensorflow:global_step/sec: 12.346
INFO:tensorflow:loss = 1.2459865, step = 121960 (8.101 sec)
INFO:tensorflow:lr = 0.000117416406 (8.095 sec)
INFO:tensorflow:global_step/sec: 12.6204
INFO:tensorflow:loss = 1.2476454, step = 122060 (7.929 sec)
INFO:tensorflow:lr = 0.000117298456 (7.933 sec)
INFO:tensorflow:global_step/sec: 12.7997
INFO:tensorflow:loss = 1.2479577, step = 122160 (7.806 sec)
INFO:tensorflow:lr = 0.00011718063 (7.803 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.75356
INFO:tensorflow:loss = 1.2421271, step = 122260 (11.424 sec)
INFO:tensorflow:lr = 0.000117062926 (11.427 sec)
INFO:tensorflow:global_step/sec: 12.6182
INFO:tensorflow:loss = 1.2467126, step = 122360 (7.931 sec)
INFO:tensorflow:lr = 0.000116945324 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.2161
INFO:tensorflow:loss = 1.2463832, step = 122460 (8.180 sec)
INFO:tensorflow:lr = 0.00011682784 (8.180 sec)
INFO:tensorflow:global_step/sec: 12.5557
INFO:tensorflow:loss = 1.2444496, step = 122560 (7.965 sec)
INFO:tensorflow:lr = 0.00011671051 (7.966 sec)
INFO:tensorflow:global_step/sec: 12.56
INFO:tensorflow:loss = 1.2485607, step = 122660 (7.968 sec)
INFO:tensorflow:lr = 0.00011659325 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.5083
INFO:tensorflow:loss = 1.2494316, step = 122760 (7.990 sec)
INFO:tensorflow:lr = 0.00011647614 (7.986 sec)
INFO:tensorflow:global_step/sec: 12.8594
INFO:tensorflow:loss = 1.2474501, step = 122860 (7.781 sec)
INFO:tensorflow:lr = 0.00011635912 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.7281
INFO:tensorflow:loss = 1.2478578, step = 122960 (7.856 sec)
INFO:tensorflow:lr = 0.00011624224 (7.857 sec)
INFO:tensorflow:global_step/sec: 12.8408
INFO:tensorflow:loss = 1.2520856, step = 123060 (7.783 sec)
INFO:tensorflow:lr = 0.000116125484 (7.782 sec)
INFO:tensorflow:global_step/sec: 12.8542
INFO:tensorflow:loss = 1.2521843, step = 123160 (7.782 sec)
INFO:tensorflow:lr = 0.00011600883 (7.782 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.06857
INFO:tensorflow:loss = 1.2535832, step = 123260 (11.027 sec)
INFO:tensorflow:lr = 0.0001158923 (11.027 sec)
INFO:tensorflow:global_step/sec: 12.9486
INFO:tensorflow:loss = 1.249761, step = 123360 (7.720 sec)
INFO:tensorflow:lr = 0.00011577587 (7.720 sec)
INFO:tensorflow:global_step/sec: 12.4898
INFO:tensorflow:loss = 1.2453451, step = 123460 (8.013 sec)
INFO:tensorflow:lr = 0.00011565958 (8.013 sec)
INFO:tensorflow:global_step/sec: 12.6435
INFO:tensorflow:loss = 1.2508979, step = 123560 (7.908 sec)
INFO:tensorflow:lr = 0.0001155434 (7.908 sec)
INFO:tensorflow:global_step/sec: 12.5327
INFO:tensorflow:loss = 1.24587, step = 123660 (7.974 sec)
INFO:tensorflow:lr = 0.000115427334 (7.975 sec)
INFO:tensorflow:global_step/sec: 12.9855
INFO:tensorflow:loss = 1.2542604, step = 123760 (7.701 sec)
INFO:tensorflow:lr = 0.000115311384 (7.701 sec)
INFO:tensorflow:global_step/sec: 12.8748
INFO:tensorflow:loss = 1.244994, step = 123860 (7.767 sec)
INFO:tensorflow:lr = 0.000115195544 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.2358
INFO:tensorflow:loss = 1.2472664, step = 123960 (8.173 sec)
INFO:tensorflow:lr = 0.00011507982 (8.172 sec)
INFO:tensorflow:global_step/sec: 12.6827
INFO:tensorflow:loss = 1.2551069, step = 124060 (7.890 sec)
INFO:tensorflow:lr = 0.000114964234 (7.888 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0551
INFO:tensorflow:loss = 1.2484986, step = 124160 (8.296 sec)
INFO:tensorflow:lr = 0.00011484874 (8.297 sec)
INFO:tensorflow:global_step/sec: 10.5292
INFO:tensorflow:loss = 1.2491708, step = 124260 (9.497 sec)
INFO:tensorflow:lr = 0.00011473338 (9.496 sec)
INFO:tensorflow:global_step/sec: 12.902
INFO:tensorflow:loss = 1.2463233, step = 124360 (7.745 sec)
INFO:tensorflow:lr = 0.00011461812 (7.746 sec)
INFO:tensorflow:global_step/sec: 12.766
INFO:tensorflow:loss = 1.2511879, step = 124460 (7.837 sec)
INFO:tensorflow:lr = 0.000114502975 (7.838 sec)
INFO:tensorflow:global_step/sec: 12.7431
INFO:tensorflow:loss = 1.2464348, step = 124560 (7.845 sec)
INFO:tensorflow:lr = 0.00011438796 (7.845 sec)
INFO:tensorflow:global_step/sec: 12.3308
INFO:tensorflow:loss = 1.2550204, step = 124660 (8.114 sec)
INFO:tensorflow:lr = 0.000114273054 (8.113 sec)
INFO:tensorflow:global_step/sec: 12.6927
INFO:tensorflow:loss = 1.2458317, step = 124760 (7.879 sec)
INFO:tensorflow:lr = 0.00011415826 (7.880 sec)
INFO:tensorflow:global_step/sec: 12.6561
INFO:tensorflow:loss = 1.2493947, step = 124860 (7.900 sec)
INFO:tensorflow:lr = 0.00011404359 (7.900 sec)
INFO:tensorflow:global_step/sec: 12.6385
INFO:tensorflow:loss = 1.2473803, step = 124960 (7.912 sec)
INFO:tensorflow:lr = 0.00011392903 (7.912 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2313
INFO:tensorflow:loss = 1.2489656, step = 125060 (8.177 sec)
INFO:tensorflow:lr = 0.000113814574 (8.181 sec)
INFO:tensorflow:global_step/sec: 10.8729
INFO:tensorflow:loss = 1.2458106, step = 125160 (9.195 sec)
INFO:tensorflow:lr = 0.00011370025 (9.192 sec)
INFO:tensorflow:global_step/sec: 12.9656
INFO:tensorflow:loss = 1.245927, step = 125260 (7.709 sec)
INFO:tensorflow:lr = 0.000113586044 (7.712 sec)
INFO:tensorflow:global_step/sec: 12.8824
INFO:tensorflow:loss = 1.245289, step = 125360 (7.763 sec)
INFO:tensorflow:lr = 0.000113471935 (7.760 sec)
INFO:tensorflow:global_step/sec: 12.6135
INFO:tensorflow:loss = 1.244993, step = 125460 (7.928 sec)
INFO:tensorflow:lr = 0.00011335795 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.6983
INFO:tensorflow:loss = 1.246616, step = 125560 (7.875 sec)
INFO:tensorflow:lr = 0.00011324408 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.7768
INFO:tensorflow:loss = 1.243581, step = 125660 (7.830 sec)
INFO:tensorflow:lr = 0.000113130314 (7.830 sec)
INFO:tensorflow:global_step/sec: 12.5408
INFO:tensorflow:loss = 1.2462535, step = 125760 (7.975 sec)
INFO:tensorflow:lr = 0.00011301667 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.7577
INFO:tensorflow:loss = 1.2469722, step = 125860 (7.834 sec)
INFO:tensorflow:lr = 0.00011290314 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.811
INFO:tensorflow:loss = 1.2492265, step = 125960 (7.806 sec)
INFO:tensorflow:lr = 0.00011278975 (7.802 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0305
INFO:tensorflow:loss = 1.2433882, step = 126060 (8.318 sec)
INFO:tensorflow:lr = 0.00011267645 (8.320 sec)
INFO:tensorflow:global_step/sec: 11.1724
INFO:tensorflow:loss = 1.2503134, step = 126160 (8.950 sec)
INFO:tensorflow:lr = 0.00011256325 (8.948 sec)
INFO:tensorflow:global_step/sec: 12.5939
INFO:tensorflow:loss = 1.2438878, step = 126260 (7.936 sec)
INFO:tensorflow:lr = 0.00011245018 (7.937 sec)
INFO:tensorflow:global_step/sec: 12.5034
INFO:tensorflow:loss = 1.2491252, step = 126360 (7.995 sec)
INFO:tensorflow:lr = 0.00011233722 (7.994 sec)
INFO:tensorflow:global_step/sec: 12.7607
INFO:tensorflow:loss = 1.2450532, step = 126460 (7.837 sec)
INFO:tensorflow:lr = 0.00011222437 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.9278
INFO:tensorflow:loss = 1.2452111, step = 126560 (7.740 sec)
INFO:tensorflow:lr = 0.00011211164 (7.740 sec)
INFO:tensorflow:global_step/sec: 12.5386
INFO:tensorflow:loss = 1.2478788, step = 126660 (7.971 sec)
INFO:tensorflow:lr = 0.00011199902 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.885
INFO:tensorflow:loss = 1.2447201, step = 126760 (7.761 sec)
INFO:tensorflow:lr = 0.00011188651 (7.766 sec)
INFO:tensorflow:global_step/sec: 12.4045
INFO:tensorflow:loss = 1.2440642, step = 126860 (8.065 sec)
INFO:tensorflow:lr = 0.000111774105 (8.060 sec)
INFO:tensorflow:global_step/sec: 12.7656
INFO:tensorflow:loss = 1.2417755, step = 126960 (7.830 sec)
INFO:tensorflow:lr = 0.00011166184 (7.830 sec)
INFO:tensorflow:global_step/sec: 12.4535
INFO:tensorflow:loss = 1.2505175, step = 127060 (8.031 sec)
INFO:tensorflow:lr = 0.00011154967 (8.031 sec)
INFO:tensorflow:Saving checkpoints for 127140 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2458371.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-127140
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-127140
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.724
INFO:tensorflow:Best (Exact Match) Accuracy: 0.724
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-127140
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 127140 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2435741, step = 127140
INFO:tensorflow:lr = 0.000111460016
INFO:tensorflow:global_step/sec: 10.2235
INFO:tensorflow:loss = 1.2465057, step = 127240 (9.783 sec)
INFO:tensorflow:lr = 0.000111348054 (9.788 sec)
INFO:tensorflow:global_step/sec: 12.5664
INFO:tensorflow:loss = 1.2451212, step = 127340 (7.958 sec)
INFO:tensorflow:lr = 0.0001112362 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.5336
INFO:tensorflow:loss = 1.2496941, step = 127440 (7.979 sec)
INFO:tensorflow:lr = 0.000111124464 (7.979 sec)
INFO:tensorflow:global_step/sec: 12.8346
INFO:tensorflow:loss = 1.2417659, step = 127540 (7.791 sec)
INFO:tensorflow:lr = 0.000111012836 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.6779
INFO:tensorflow:loss = 1.2437657, step = 127640 (7.892 sec)
INFO:tensorflow:lr = 0.00011090133 (7.895 sec)
INFO:tensorflow:global_step/sec: 12.7347
INFO:tensorflow:loss = 1.2443695, step = 127740 (7.848 sec)
INFO:tensorflow:lr = 0.000110789915 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.4271
INFO:tensorflow:loss = 1.2493587, step = 127840 (8.049 sec)
INFO:tensorflow:lr = 0.00011067862 (8.051 sec)
INFO:tensorflow:global_step/sec: 12.5781
INFO:tensorflow:loss = 1.2441834, step = 127940 (7.953 sec)
INFO:tensorflow:lr = 0.00011056746 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.8326
INFO:tensorflow:loss = 1.2549399, step = 128040 (7.792 sec)
INFO:tensorflow:lr = 0.00011045637 (7.792 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.24998
INFO:tensorflow:loss = 1.2466215, step = 128140 (12.121 sec)
INFO:tensorflow:lr = 0.00011034542 (12.123 sec)
INFO:tensorflow:global_step/sec: 12.5389
INFO:tensorflow:loss = 1.2452357, step = 128240 (7.971 sec)
INFO:tensorflow:lr = 0.00011023458 (7.974 sec)
INFO:tensorflow:global_step/sec: 12.4399
INFO:tensorflow:loss = 1.2436724, step = 128340 (8.043 sec)
INFO:tensorflow:lr = 0.00011012384 (8.039 sec)
INFO:tensorflow:global_step/sec: 12.2715
INFO:tensorflow:loss = 1.2544248, step = 128440 (8.145 sec)
INFO:tensorflow:lr = 0.00011001323 (8.145 sec)
INFO:tensorflow:global_step/sec: 12.527
INFO:tensorflow:loss = 1.2489731, step = 128540 (7.989 sec)
INFO:tensorflow:lr = 0.0001099027 (7.989 sec)
INFO:tensorflow:global_step/sec: 12.6973
INFO:tensorflow:loss = 1.2446793, step = 128640 (7.874 sec)
INFO:tensorflow:lr = 0.000109792316 (7.876 sec)
INFO:tensorflow:global_step/sec: 12.4341
INFO:tensorflow:loss = 1.2533972, step = 128740 (8.037 sec)
INFO:tensorflow:lr = 0.00010968202 (8.036 sec)
INFO:tensorflow:global_step/sec: 12.5414
INFO:tensorflow:loss = 1.2431896, step = 128840 (7.974 sec)
INFO:tensorflow:lr = 0.00010957183 (7.974 sec)
INFO:tensorflow:global_step/sec: 12.3855
INFO:tensorflow:loss = 1.2443397, step = 128940 (8.080 sec)
INFO:tensorflow:lr = 0.00010946177 (8.080 sec)
INFO:tensorflow:global_step/sec: 12.488
INFO:tensorflow:loss = 1.244244, step = 129040 (8.002 sec)
INFO:tensorflow:lr = 0.00010935181 (8.003 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.07857
INFO:tensorflow:loss = 1.2466154, step = 129140 (12.382 sec)
INFO:tensorflow:lr = 0.00010924197 (12.382 sec)
INFO:tensorflow:global_step/sec: 12.3629
INFO:tensorflow:loss = 1.2436008, step = 129240 (8.086 sec)
INFO:tensorflow:lr = 0.00010913224 (8.086 sec)
INFO:tensorflow:global_step/sec: 12.295
INFO:tensorflow:loss = 1.2524009, step = 129340 (8.135 sec)
INFO:tensorflow:lr = 0.00010902259 (8.135 sec)
INFO:tensorflow:global_step/sec: 12.3022
INFO:tensorflow:loss = 1.244007, step = 129440 (8.129 sec)
INFO:tensorflow:lr = 0.00010891308 (8.129 sec)
INFO:tensorflow:global_step/sec: 12.4037
INFO:tensorflow:loss = 1.2510656, step = 129540 (8.064 sec)
INFO:tensorflow:lr = 0.00010880369 (8.063 sec)
INFO:tensorflow:global_step/sec: 12.3284
INFO:tensorflow:loss = 1.2440971, step = 129640 (8.111 sec)
INFO:tensorflow:lr = 0.000108694396 (8.111 sec)
INFO:tensorflow:global_step/sec: 12.1042
INFO:tensorflow:loss = 1.2430845, step = 129740 (8.262 sec)
INFO:tensorflow:lr = 0.00010858521 (8.262 sec)
INFO:tensorflow:global_step/sec: 12.1477
INFO:tensorflow:loss = 1.2497059, step = 129840 (8.226 sec)
INFO:tensorflow:lr = 0.000108476124 (8.227 sec)
INFO:tensorflow:global_step/sec: 12.1074
INFO:tensorflow:loss = 1.2511698, step = 129940 (8.260 sec)
INFO:tensorflow:lr = 0.00010836717 (8.258 sec)
INFO:tensorflow:global_step/sec: 12.6255
INFO:tensorflow:loss = 1.2424986, step = 130040 (7.926 sec)
INFO:tensorflow:lr = 0.000108258304 (7.927 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.91354
INFO:tensorflow:loss = 1.2430753, step = 130140 (12.632 sec)
INFO:tensorflow:lr = 0.000108149565 (12.635 sec)
INFO:tensorflow:global_step/sec: 12.3666
INFO:tensorflow:loss = 1.2508368, step = 130240 (8.087 sec)
INFO:tensorflow:lr = 0.00010804091 (8.087 sec)
INFO:tensorflow:global_step/sec: 12.3495
INFO:tensorflow:loss = 1.2460352, step = 130340 (8.097 sec)
INFO:tensorflow:lr = 0.00010793238 (8.092 sec)
INFO:tensorflow:global_step/sec: 12.2387
INFO:tensorflow:loss = 1.2445351, step = 130440 (8.175 sec)
INFO:tensorflow:lr = 0.000107823966 (8.175 sec)
INFO:tensorflow:global_step/sec: 12.2714
INFO:tensorflow:loss = 1.24298, step = 130540 (8.144 sec)
INFO:tensorflow:lr = 0.00010771565 (8.149 sec)
INFO:tensorflow:global_step/sec: 12.2735
INFO:tensorflow:loss = 1.2450466, step = 130640 (8.149 sec)
INFO:tensorflow:lr = 0.000107607455 (8.145 sec)
INFO:tensorflow:global_step/sec: 12.2928
INFO:tensorflow:loss = 1.2488058, step = 130740 (8.135 sec)
INFO:tensorflow:lr = 0.00010749935 (8.136 sec)
INFO:tensorflow:global_step/sec: 12.1511
INFO:tensorflow:loss = 1.2458876, step = 130840 (8.228 sec)
INFO:tensorflow:lr = 0.00010739135 (8.227 sec)
INFO:tensorflow:global_step/sec: 12.4498
INFO:tensorflow:loss = 1.2464055, step = 130940 (8.038 sec)
INFO:tensorflow:lr = 0.00010728349 (8.038 sec)
INFO:tensorflow:global_step/sec: 12.5961
INFO:tensorflow:loss = 1.2468756, step = 131040 (7.933 sec)
INFO:tensorflow:lr = 0.000107175714 (7.934 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.15478
INFO:tensorflow:loss = 1.2451632, step = 131140 (12.266 sec)
INFO:tensorflow:lr = 0.000107068074 (12.265 sec)
INFO:tensorflow:global_step/sec: 12.3205
INFO:tensorflow:loss = 1.2453297, step = 131240 (8.116 sec)
INFO:tensorflow:lr = 0.0001069605 (8.117 sec)
INFO:tensorflow:global_step/sec: 11.9643
INFO:tensorflow:loss = 1.2488296, step = 131340 (8.361 sec)
INFO:tensorflow:lr = 0.000106853055 (8.360 sec)
INFO:tensorflow:global_step/sec: 12.4314
INFO:tensorflow:loss = 1.2435274, step = 131440 (8.043 sec)
INFO:tensorflow:lr = 0.00010674573 (8.043 sec)
INFO:tensorflow:global_step/sec: 12.0054
INFO:tensorflow:loss = 1.245277, step = 131540 (8.327 sec)
INFO:tensorflow:lr = 0.0001066385 (8.328 sec)
INFO:tensorflow:global_step/sec: 12.2444
INFO:tensorflow:loss = 1.243785, step = 131640 (8.168 sec)
INFO:tensorflow:lr = 0.00010653138 (8.172 sec)
INFO:tensorflow:global_step/sec: 12.2932
INFO:tensorflow:loss = 1.248311, step = 131740 (8.131 sec)
INFO:tensorflow:lr = 0.00010642436 (8.126 sec)
INFO:tensorflow:global_step/sec: 12.3766
INFO:tensorflow:loss = 1.2436168, step = 131840 (8.086 sec)
INFO:tensorflow:lr = 0.00010631745 (8.086 sec)
INFO:tensorflow:global_step/sec: 12.3664
INFO:tensorflow:loss = 1.2433931, step = 131940 (8.088 sec)
INFO:tensorflow:lr = 0.00010621067 (8.088 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.14088
INFO:tensorflow:loss = 1.246407, step = 132040 (12.280 sec)
INFO:tensorflow:lr = 0.00010610395 (12.281 sec)
INFO:tensorflow:global_step/sec: 12.2325
INFO:tensorflow:loss = 1.2487501, step = 132140 (8.171 sec)
INFO:tensorflow:lr = 0.00010599738 (8.171 sec)
INFO:tensorflow:global_step/sec: 12.167
INFO:tensorflow:loss = 1.2465798, step = 132240 (8.220 sec)
INFO:tensorflow:lr = 0.000105890904 (8.219 sec)
INFO:tensorflow:global_step/sec: 12.1129
INFO:tensorflow:loss = 1.2428634, step = 132340 (8.257 sec)
INFO:tensorflow:lr = 0.00010578453 (8.258 sec)
INFO:tensorflow:global_step/sec: 12.1236
INFO:tensorflow:loss = 1.248153, step = 132440 (8.246 sec)
INFO:tensorflow:lr = 0.00010567827 (8.250 sec)
INFO:tensorflow:global_step/sec: 12.2855
INFO:tensorflow:loss = 1.2455584, step = 132540 (8.139 sec)
INFO:tensorflow:lr = 0.0001055721 (8.135 sec)
INFO:tensorflow:global_step/sec: 12.1064
INFO:tensorflow:loss = 1.244128, step = 132640 (8.263 sec)
INFO:tensorflow:lr = 0.00010546607 (8.263 sec)
INFO:tensorflow:global_step/sec: 12.0689
INFO:tensorflow:loss = 1.2437512, step = 132740 (8.283 sec)
INFO:tensorflow:lr = 0.00010536012 (8.283 sec)
INFO:tensorflow:global_step/sec: 12.582
INFO:tensorflow:loss = 1.2527406, step = 132840 (7.953 sec)
INFO:tensorflow:lr = 0.00010525428 (7.960 sec)
INFO:tensorflow:global_step/sec: 12.4056
INFO:tensorflow:loss = 1.2459419, step = 132940 (8.061 sec)
INFO:tensorflow:lr = 0.00010514854 (8.055 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.60371
INFO:tensorflow:loss = 1.2440192, step = 133040 (11.618 sec)
INFO:tensorflow:lr = 0.00010504292 (11.617 sec)
INFO:tensorflow:global_step/sec: 12.3615
INFO:tensorflow:loss = 1.246831, step = 133140 (8.095 sec)
INFO:tensorflow:lr = 0.000104937404 (8.096 sec)
INFO:tensorflow:global_step/sec: 12.1262
INFO:tensorflow:loss = 1.2434736, step = 133240 (8.243 sec)
INFO:tensorflow:lr = 0.00010483199 (8.244 sec)
INFO:tensorflow:global_step/sec: 11.9553
INFO:tensorflow:loss = 1.2503418, step = 133340 (8.365 sec)
INFO:tensorflow:lr = 0.00010472667 (8.364 sec)
INFO:tensorflow:global_step/sec: 11.8907
INFO:tensorflow:loss = 1.2424436, step = 133440 (8.409 sec)
INFO:tensorflow:lr = 0.00010462148 (8.408 sec)
INFO:tensorflow:global_step/sec: 12.2531
INFO:tensorflow:loss = 1.2495891, step = 133540 (8.160 sec)
INFO:tensorflow:lr = 0.000104516395 (8.160 sec)
INFO:tensorflow:global_step/sec: 12.2438
INFO:tensorflow:loss = 1.2514443, step = 133640 (8.172 sec)
INFO:tensorflow:lr = 0.00010441141 (8.174 sec)
INFO:tensorflow:global_step/sec: 12.1721
INFO:tensorflow:loss = 1.2426683, step = 133740 (8.216 sec)
INFO:tensorflow:lr = 0.00010430651 (8.216 sec)
INFO:tensorflow:global_step/sec: 12.3861
INFO:tensorflow:loss = 1.2496032, step = 133840 (8.072 sec)
INFO:tensorflow:lr = 0.00010420173 (8.072 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.7193
INFO:tensorflow:loss = 1.2486618, step = 133940 (8.536 sec)
INFO:tensorflow:lr = 0.00010409707 (8.537 sec)
INFO:tensorflow:global_step/sec: 10.1707
INFO:tensorflow:loss = 1.2442518, step = 134040 (9.830 sec)
INFO:tensorflow:lr = 0.0001039925 (9.829 sec)
INFO:tensorflow:global_step/sec: 12.3223
INFO:tensorflow:loss = 1.2536051, step = 134140 (8.114 sec)
INFO:tensorflow:lr = 0.00010388803 (8.115 sec)
INFO:tensorflow:global_step/sec: 12.4179
INFO:tensorflow:loss = 1.2437172, step = 134240 (8.052 sec)
INFO:tensorflow:lr = 0.00010378366 (8.053 sec)
INFO:tensorflow:global_step/sec: 12.2421
INFO:tensorflow:loss = 1.243759, step = 134340 (8.171 sec)
INFO:tensorflow:lr = 0.000103679406 (8.169 sec)
INFO:tensorflow:global_step/sec: 12.1969
INFO:tensorflow:loss = 1.2443966, step = 134440 (8.194 sec)
INFO:tensorflow:lr = 0.000103575265 (8.195 sec)
INFO:tensorflow:global_step/sec: 12.5337
INFO:tensorflow:loss = 1.2484913, step = 134540 (7.979 sec)
INFO:tensorflow:lr = 0.000103471226 (7.979 sec)
INFO:tensorflow:global_step/sec: 12.4363
INFO:tensorflow:loss = 1.2449461, step = 134640 (8.041 sec)
INFO:tensorflow:lr = 0.00010336729 (8.041 sec)
INFO:tensorflow:global_step/sec: 12.1351
INFO:tensorflow:loss = 1.2493279, step = 134740 (8.239 sec)
INFO:tensorflow:lr = 0.00010326345 (8.239 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.9634
INFO:tensorflow:loss = 1.246514, step = 134840 (8.360 sec)
INFO:tensorflow:lr = 0.00010315971 (8.363 sec)
INFO:tensorflow:global_step/sec: 10.6141
INFO:tensorflow:loss = 1.2479151, step = 134940 (9.421 sec)
INFO:tensorflow:lr = 0.000103056096 (9.418 sec)
INFO:tensorflow:global_step/sec: 12.1932
INFO:tensorflow:loss = 1.2446302, step = 135040 (8.205 sec)
INFO:tensorflow:lr = 0.000102952574 (8.206 sec)
INFO:tensorflow:global_step/sec: 12.3143
INFO:tensorflow:loss = 1.2450219, step = 135140 (8.120 sec)
INFO:tensorflow:lr = 0.00010284917 (8.119 sec)
INFO:tensorflow:global_step/sec: 12.2555
INFO:tensorflow:loss = 1.2433691, step = 135240 (8.155 sec)
INFO:tensorflow:lr = 0.00010274584 (8.155 sec)
INFO:tensorflow:global_step/sec: 12.2253
INFO:tensorflow:loss = 1.2495849, step = 135340 (8.180 sec)
INFO:tensorflow:lr = 0.00010264262 (8.180 sec)
INFO:tensorflow:global_step/sec: 12.225
INFO:tensorflow:loss = 1.2457464, step = 135440 (8.185 sec)
INFO:tensorflow:lr = 0.000102539525 (8.185 sec)
INFO:tensorflow:global_step/sec: 12.3318
INFO:tensorflow:loss = 1.2438371, step = 135540 (8.107 sec)
INFO:tensorflow:lr = 0.00010243652 (8.107 sec)
INFO:tensorflow:global_step/sec: 12.4329
INFO:tensorflow:loss = 1.2439129, step = 135640 (8.047 sec)
INFO:tensorflow:lr = 0.000102333615 (8.047 sec)
INFO:tensorflow:global_step/sec: 12.4265
INFO:tensorflow:loss = 1.2445234, step = 135740 (8.041 sec)
INFO:tensorflow:lr = 0.00010223082 (8.042 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.3109
INFO:tensorflow:loss = 1.247158, step = 135840 (8.856 sec)
INFO:tensorflow:lr = 0.00010212812 (8.856 sec)
INFO:tensorflow:global_step/sec: 10.9069
INFO:tensorflow:loss = 1.2456703, step = 135940 (9.154 sec)
INFO:tensorflow:lr = 0.000102025544 (9.158 sec)
INFO:tensorflow:global_step/sec: 12.004
INFO:tensorflow:loss = 1.249978, step = 136040 (8.336 sec)
INFO:tensorflow:lr = 0.00010192303 (8.331 sec)
INFO:tensorflow:global_step/sec: 12.3161
INFO:tensorflow:loss = 1.2440797, step = 136140 (8.115 sec)
INFO:tensorflow:lr = 0.00010182066 (8.115 sec)
INFO:tensorflow:global_step/sec: 12.4287
INFO:tensorflow:loss = 1.2494134, step = 136240 (8.046 sec)
INFO:tensorflow:lr = 0.000101718375 (8.046 sec)
INFO:tensorflow:global_step/sec: 12.2461
INFO:tensorflow:loss = 1.2424796, step = 136340 (8.169 sec)
INFO:tensorflow:lr = 0.0001016162 (8.171 sec)
INFO:tensorflow:global_step/sec: 12.1615
INFO:tensorflow:loss = 1.2436228, step = 136440 (8.224 sec)
INFO:tensorflow:lr = 0.00010151413 (8.221 sec)
INFO:tensorflow:global_step/sec: 12.4358
INFO:tensorflow:loss = 1.2450893, step = 136540 (8.037 sec)
INFO:tensorflow:lr = 0.00010141214 (8.038 sec)
INFO:tensorflow:global_step/sec: 12.3499
INFO:tensorflow:loss = 1.2470615, step = 136640 (8.102 sec)
INFO:tensorflow:lr = 0.000101310274 (8.101 sec)
INFO:tensorflow:global_step/sec: 12.0695
INFO:tensorflow:loss = 1.2428521, step = 136740 (8.283 sec)
INFO:tensorflow:lr = 0.000101208505 (8.284 sec)
INFO:tensorflow:global_step/sec: 12.4794
INFO:tensorflow:loss = 1.243703, step = 136840 (8.011 sec)
INFO:tensorflow:lr = 0.000101106845 (8.011 sec)
INFO:tensorflow:Saving checkpoints for 136920 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2554393.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-136920
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-136920
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.723
INFO:tensorflow:Best (Exact Match) Accuracy: 0.724
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-136920
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 136920 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2442503, step = 136920
INFO:tensorflow:lr = 0.00010102558
INFO:tensorflow:global_step/sec: 9.49728
INFO:tensorflow:loss = 1.2426513, step = 137020 (10.534 sec)
INFO:tensorflow:lr = 0.00010092411 (10.534 sec)
INFO:tensorflow:global_step/sec: 12.1446
INFO:tensorflow:loss = 1.2465923, step = 137120 (8.235 sec)
INFO:tensorflow:lr = 0.00010082272 (8.235 sec)
INFO:tensorflow:global_step/sec: 12.0058
INFO:tensorflow:loss = 1.2437319, step = 137220 (8.331 sec)
INFO:tensorflow:lr = 0.00010072145 (8.333 sec)
INFO:tensorflow:global_step/sec: 12.1429
INFO:tensorflow:loss = 1.2430804, step = 137320 (8.237 sec)
INFO:tensorflow:lr = 0.000100620266 (8.234 sec)
INFO:tensorflow:global_step/sec: 11.9963
INFO:tensorflow:loss = 1.2503809, step = 137420 (8.329 sec)
INFO:tensorflow:lr = 0.00010051919 (8.330 sec)
INFO:tensorflow:global_step/sec: 11.9954
INFO:tensorflow:loss = 1.245267, step = 137520 (8.336 sec)
INFO:tensorflow:lr = 0.00010041822 (8.345 sec)
INFO:tensorflow:global_step/sec: 12.0687
INFO:tensorflow:loss = 1.244724, step = 137620 (8.290 sec)
INFO:tensorflow:lr = 0.00010031733 (8.283 sec)
INFO:tensorflow:global_step/sec: 12.3354
INFO:tensorflow:loss = 1.2446139, step = 137720 (8.108 sec)
INFO:tensorflow:lr = 0.000100216566 (8.107 sec)
INFO:tensorflow:global_step/sec: 12.2787
INFO:tensorflow:loss = 1.2453194, step = 137820 (8.139 sec)
INFO:tensorflow:lr = 0.0001001159 (8.138 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.83209
INFO:tensorflow:loss = 1.2472328, step = 137920 (12.767 sec)
INFO:tensorflow:lr = 0.00010001531 (12.769 sec)
INFO:tensorflow:global_step/sec: 12.1816
INFO:tensorflow:loss = 1.2472757, step = 138020 (8.214 sec)
INFO:tensorflow:lr = 9.991486e-05 (8.212 sec)
INFO:tensorflow:global_step/sec: 12.2596
INFO:tensorflow:loss = 1.2465109, step = 138120 (8.152 sec)
INFO:tensorflow:lr = 9.981449e-05 (8.158 sec)
INFO:tensorflow:global_step/sec: 12.3647
INFO:tensorflow:loss = 1.2436755, step = 138220 (8.094 sec)
INFO:tensorflow:lr = 9.971423e-05 (8.088 sec)
INFO:tensorflow:global_step/sec: 12.373
INFO:tensorflow:loss = 1.2455561, step = 138320 (8.083 sec)
INFO:tensorflow:lr = 9.961406e-05 (8.086 sec)
INFO:tensorflow:global_step/sec: 12.1114
INFO:tensorflow:loss = 1.2426962, step = 138420 (8.256 sec)
INFO:tensorflow:lr = 9.9513985e-05 (8.254 sec)
INFO:tensorflow:global_step/sec: 12.3349
INFO:tensorflow:loss = 1.2463111, step = 138520 (8.101 sec)
INFO:tensorflow:lr = 9.9414036e-05 (8.105 sec)
INFO:tensorflow:global_step/sec: 12.0076
INFO:tensorflow:loss = 1.2430253, step = 138620 (8.328 sec)
INFO:tensorflow:lr = 9.9314166e-05 (8.329 sec)
INFO:tensorflow:global_step/sec: 12.1418
INFO:tensorflow:loss = 1.2426336, step = 138720 (8.243 sec)
INFO:tensorflow:lr = 9.9214405e-05 (8.238 sec)
INFO:tensorflow:global_step/sec: 12.0151
INFO:tensorflow:loss = 1.2564312, step = 138820 (8.317 sec)
INFO:tensorflow:lr = 9.911473e-05 (8.316 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.72
INFO:tensorflow:loss = 1.2428147, step = 138920 (12.956 sec)
INFO:tensorflow:lr = 9.901517e-05 (12.958 sec)
INFO:tensorflow:global_step/sec: 12.1405
INFO:tensorflow:loss = 1.2480109, step = 139020 (8.235 sec)
INFO:tensorflow:lr = 9.891571e-05 (8.235 sec)
INFO:tensorflow:global_step/sec: 12.1696
INFO:tensorflow:loss = 1.2434272, step = 139120 (8.221 sec)
INFO:tensorflow:lr = 9.8816345e-05 (8.220 sec)
INFO:tensorflow:global_step/sec: 12.3821
INFO:tensorflow:loss = 1.2433711, step = 139220 (8.073 sec)
INFO:tensorflow:lr = 9.871709e-05 (8.073 sec)
INFO:tensorflow:global_step/sec: 11.899
INFO:tensorflow:loss = 1.2432872, step = 139320 (8.402 sec)
INFO:tensorflow:lr = 9.861792e-05 (8.401 sec)
INFO:tensorflow:global_step/sec: 12.294
INFO:tensorflow:loss = 1.2443063, step = 139420 (8.140 sec)
INFO:tensorflow:lr = 9.8518845e-05 (8.140 sec)
INFO:tensorflow:global_step/sec: 11.9733
INFO:tensorflow:loss = 1.2486244, step = 139520 (8.351 sec)
INFO:tensorflow:lr = 9.841989e-05 (8.351 sec)
INFO:tensorflow:global_step/sec: 12.3805
INFO:tensorflow:loss = 1.2429479, step = 139620 (8.074 sec)
INFO:tensorflow:lr = 9.832102e-05 (8.075 sec)
INFO:tensorflow:global_step/sec: 12.2166
INFO:tensorflow:loss = 1.2444541, step = 139720 (8.189 sec)
INFO:tensorflow:lr = 9.822226e-05 (8.189 sec)
INFO:tensorflow:global_step/sec: 12.0897
INFO:tensorflow:loss = 1.2436047, step = 139820 (8.271 sec)
INFO:tensorflow:lr = 9.8123586e-05 (8.271 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.94567
INFO:tensorflow:loss = 1.2447098, step = 139920 (12.585 sec)
INFO:tensorflow:lr = 9.802502e-05 (12.584 sec)
INFO:tensorflow:global_step/sec: 12.1545
INFO:tensorflow:loss = 1.2488983, step = 140020 (8.230 sec)
INFO:tensorflow:lr = 9.792656e-05 (8.232 sec)
INFO:tensorflow:global_step/sec: 12.3331
INFO:tensorflow:loss = 1.2468932, step = 140120 (8.102 sec)
INFO:tensorflow:lr = 9.782818e-05 (8.103 sec)
INFO:tensorflow:global_step/sec: 12.1976
INFO:tensorflow:loss = 1.2424612, step = 140220 (8.202 sec)
INFO:tensorflow:lr = 9.772992e-05 (8.198 sec)
INFO:tensorflow:global_step/sec: 12.1431
INFO:tensorflow:loss = 1.245854, step = 140320 (8.232 sec)
INFO:tensorflow:lr = 9.763174e-05 (8.232 sec)
INFO:tensorflow:global_step/sec: 12.2553
INFO:tensorflow:loss = 1.2430899, step = 140420 (8.160 sec)
INFO:tensorflow:lr = 9.753366e-05 (8.162 sec)
INFO:tensorflow:global_step/sec: 12.3075
INFO:tensorflow:loss = 1.2432994, step = 140520 (8.129 sec)
INFO:tensorflow:lr = 9.7435695e-05 (8.127 sec)
INFO:tensorflow:global_step/sec: 12.2089
INFO:tensorflow:loss = 1.2422528, step = 140620 (8.190 sec)
INFO:tensorflow:lr = 9.733782e-05 (8.189 sec)
INFO:tensorflow:global_step/sec: 12.4876
INFO:tensorflow:loss = 1.2459801, step = 140720 (8.004 sec)
INFO:tensorflow:lr = 9.7240045e-05 (8.005 sec)
INFO:tensorflow:global_step/sec: 12.246
INFO:tensorflow:loss = 1.2448704, step = 140820 (8.166 sec)
INFO:tensorflow:lr = 9.714235e-05 (8.166 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.94083
INFO:tensorflow:loss = 1.2432497, step = 140920 (12.593 sec)
INFO:tensorflow:lr = 9.7044765e-05 (12.594 sec)
INFO:tensorflow:global_step/sec: 12.578
INFO:tensorflow:loss = 1.2454319, step = 141020 (7.955 sec)
INFO:tensorflow:lr = 9.694729e-05 (7.955 sec)
INFO:tensorflow:global_step/sec: 12.2807
INFO:tensorflow:loss = 1.2427717, step = 141120 (8.142 sec)
INFO:tensorflow:lr = 9.68499e-05 (8.141 sec)
INFO:tensorflow:global_step/sec: 12.3299
INFO:tensorflow:loss = 1.2423016, step = 141220 (8.115 sec)
INFO:tensorflow:lr = 9.6752614e-05 (8.119 sec)
INFO:tensorflow:global_step/sec: 12.2827
INFO:tensorflow:loss = 1.2446163, step = 141320 (8.139 sec)
INFO:tensorflow:lr = 9.665543e-05 (8.135 sec)
INFO:tensorflow:global_step/sec: 12.4412
INFO:tensorflow:loss = 1.2545216, step = 141420 (8.038 sec)
INFO:tensorflow:lr = 9.655833e-05 (8.038 sec)
INFO:tensorflow:global_step/sec: 12.4062
INFO:tensorflow:loss = 1.2451398, step = 141520 (8.059 sec)
INFO:tensorflow:lr = 9.646134e-05 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.2396
INFO:tensorflow:loss = 1.2458344, step = 141620 (8.166 sec)
INFO:tensorflow:lr = 9.6364434e-05 (8.171 sec)
INFO:tensorflow:global_step/sec: 12.5565
INFO:tensorflow:loss = 1.2435321, step = 141720 (7.964 sec)
INFO:tensorflow:lr = 9.626764e-05 (7.959 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.42035
INFO:tensorflow:loss = 1.2429127, step = 141820 (11.878 sec)
INFO:tensorflow:lr = 9.6170945e-05 (11.878 sec)
INFO:tensorflow:global_step/sec: 12.3013
INFO:tensorflow:loss = 1.2506694, step = 141920 (8.127 sec)
INFO:tensorflow:lr = 9.607432e-05 (8.126 sec)
INFO:tensorflow:global_step/sec: 12.7147
INFO:tensorflow:loss = 1.2428731, step = 142020 (7.865 sec)
INFO:tensorflow:lr = 9.597782e-05 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.5149
INFO:tensorflow:loss = 1.2532231, step = 142120 (7.991 sec)
INFO:tensorflow:lr = 9.5881405e-05 (7.990 sec)
INFO:tensorflow:global_step/sec: 12.3754
INFO:tensorflow:loss = 1.2438812, step = 142220 (8.080 sec)
INFO:tensorflow:lr = 9.578509e-05 (8.081 sec)
INFO:tensorflow:global_step/sec: 12.5211
INFO:tensorflow:loss = 1.2414047, step = 142320 (7.986 sec)
INFO:tensorflow:lr = 9.568886e-05 (7.985 sec)
INFO:tensorflow:global_step/sec: 12.4172
INFO:tensorflow:loss = 1.2448086, step = 142420 (8.059 sec)
INFO:tensorflow:lr = 9.559275e-05 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.5996
INFO:tensorflow:loss = 1.241774, step = 142520 (7.939 sec)
INFO:tensorflow:lr = 9.549673e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.1413
INFO:tensorflow:loss = 1.2439814, step = 142620 (8.235 sec)
INFO:tensorflow:lr = 9.540079e-05 (8.232 sec)
INFO:tensorflow:global_step/sec: 12.2161
INFO:tensorflow:loss = 1.2453963, step = 142720 (8.186 sec)
INFO:tensorflow:lr = 9.530496e-05 (8.185 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.8836
INFO:tensorflow:loss = 1.2426373, step = 142820 (11.257 sec)
INFO:tensorflow:lr = 9.520922e-05 (11.256 sec)
INFO:tensorflow:global_step/sec: 12.6974
INFO:tensorflow:loss = 1.2442544, step = 142920 (7.873 sec)
INFO:tensorflow:lr = 9.511357e-05 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.4545
INFO:tensorflow:loss = 1.2444447, step = 143020 (8.030 sec)
INFO:tensorflow:lr = 9.501804e-05 (8.029 sec)
INFO:tensorflow:global_step/sec: 12.2781
INFO:tensorflow:loss = 1.2456886, step = 143120 (8.145 sec)
INFO:tensorflow:lr = 9.492259e-05 (8.146 sec)
INFO:tensorflow:global_step/sec: 12.6858
INFO:tensorflow:loss = 1.2470523, step = 143220 (7.878 sec)
INFO:tensorflow:lr = 9.482725e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.4909
INFO:tensorflow:loss = 1.2446479, step = 143320 (8.006 sec)
INFO:tensorflow:lr = 9.4731986e-05 (8.010 sec)
INFO:tensorflow:global_step/sec: 12.3774
INFO:tensorflow:loss = 1.2446898, step = 143420 (8.085 sec)
INFO:tensorflow:lr = 9.4636816e-05 (8.080 sec)
INFO:tensorflow:global_step/sec: 12.4325
INFO:tensorflow:loss = 1.2465398, step = 143520 (8.043 sec)
INFO:tensorflow:lr = 9.454176e-05 (8.043 sec)
INFO:tensorflow:global_step/sec: 12.2342
INFO:tensorflow:loss = 1.2445402, step = 143620 (8.173 sec)
INFO:tensorflow:lr = 9.444679e-05 (8.173 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1484
INFO:tensorflow:loss = 1.2433293, step = 143720 (8.235 sec)
INFO:tensorflow:lr = 9.435192e-05 (8.237 sec)
INFO:tensorflow:global_step/sec: 10.611
INFO:tensorflow:loss = 1.2452755, step = 143820 (9.419 sec)
INFO:tensorflow:lr = 9.4257135e-05 (9.417 sec)
INFO:tensorflow:global_step/sec: 12.7544
INFO:tensorflow:loss = 1.2486116, step = 143920 (7.843 sec)
INFO:tensorflow:lr = 9.4162446e-05 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.6621
INFO:tensorflow:loss = 1.2436063, step = 144020 (7.892 sec)
INFO:tensorflow:lr = 9.4067866e-05 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.3106
INFO:tensorflow:loss = 1.2431039, step = 144120 (8.124 sec)
INFO:tensorflow:lr = 9.3973365e-05 (8.124 sec)
INFO:tensorflow:global_step/sec: 12.5707
INFO:tensorflow:loss = 1.2427852, step = 144220 (7.954 sec)
INFO:tensorflow:lr = 9.387897e-05 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.4048
INFO:tensorflow:loss = 1.2442795, step = 144320 (8.063 sec)
INFO:tensorflow:lr = 9.3784656e-05 (8.064 sec)
INFO:tensorflow:global_step/sec: 12.5874
INFO:tensorflow:loss = 1.24356, step = 144420 (7.947 sec)
INFO:tensorflow:lr = 9.369045e-05 (7.947 sec)
INFO:tensorflow:global_step/sec: 12.514
INFO:tensorflow:loss = 1.2426248, step = 144520 (7.989 sec)
INFO:tensorflow:lr = 9.359634e-05 (7.988 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2544
INFO:tensorflow:loss = 1.2479446, step = 144620 (8.165 sec)
INFO:tensorflow:lr = 9.350232e-05 (8.166 sec)
INFO:tensorflow:global_step/sec: 10.9916
INFO:tensorflow:loss = 1.2435095, step = 144720 (9.092 sec)
INFO:tensorflow:lr = 9.3408395e-05 (9.091 sec)
INFO:tensorflow:global_step/sec: 12.7682
INFO:tensorflow:loss = 1.2506919, step = 144820 (7.832 sec)
INFO:tensorflow:lr = 9.3314564e-05 (7.831 sec)
INFO:tensorflow:global_step/sec: 12.4579
INFO:tensorflow:loss = 1.2430148, step = 144920 (8.028 sec)
INFO:tensorflow:lr = 9.322082e-05 (8.032 sec)
INFO:tensorflow:global_step/sec: 12.5404
INFO:tensorflow:loss = 1.2427722, step = 145020 (7.975 sec)
INFO:tensorflow:lr = 9.3127186e-05 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.6
INFO:tensorflow:loss = 1.2560487, step = 145120 (7.941 sec)
INFO:tensorflow:lr = 9.303363e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.4571
INFO:tensorflow:loss = 1.2459077, step = 145220 (8.022 sec)
INFO:tensorflow:lr = 9.294019e-05 (8.021 sec)
INFO:tensorflow:global_step/sec: 12.7962
INFO:tensorflow:loss = 1.2429833, step = 145320 (7.815 sec)
INFO:tensorflow:lr = 9.284682e-05 (7.816 sec)
INFO:tensorflow:global_step/sec: 12.6749
INFO:tensorflow:loss = 1.244671, step = 145420 (7.890 sec)
INFO:tensorflow:lr = 9.275354e-05 (7.893 sec)
INFO:tensorflow:global_step/sec: 12.7
INFO:tensorflow:loss = 1.2438098, step = 145520 (7.877 sec)
INFO:tensorflow:lr = 9.2660375e-05 (7.873 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.5416
INFO:tensorflow:loss = 1.2416648, step = 145620 (8.670 sec)
INFO:tensorflow:lr = 9.25673e-05 (8.670 sec)
INFO:tensorflow:global_step/sec: 11.4268
INFO:tensorflow:loss = 1.2421402, step = 145720 (8.746 sec)
INFO:tensorflow:lr = 9.2474314e-05 (8.750 sec)
INFO:tensorflow:global_step/sec: 12.6866
INFO:tensorflow:loss = 1.2447598, step = 145820 (7.886 sec)
INFO:tensorflow:lr = 9.2381415e-05 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.6577
INFO:tensorflow:loss = 1.2479534, step = 145920 (7.901 sec)
INFO:tensorflow:lr = 9.228862e-05 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.1214
INFO:tensorflow:loss = 1.2518696, step = 146020 (8.243 sec)
INFO:tensorflow:lr = 9.219592e-05 (8.245 sec)
INFO:tensorflow:global_step/sec: 12.8833
INFO:tensorflow:loss = 1.248869, step = 146120 (7.764 sec)
INFO:tensorflow:lr = 9.210329e-05 (7.762 sec)
INFO:tensorflow:global_step/sec: 12.4983
INFO:tensorflow:loss = 1.2434883, step = 146220 (7.999 sec)
INFO:tensorflow:lr = 9.2010785e-05 (8.001 sec)
INFO:tensorflow:global_step/sec: 12.7547
INFO:tensorflow:loss = 1.2447973, step = 146320 (7.843 sec)
INFO:tensorflow:lr = 9.1918344e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.4445
INFO:tensorflow:loss = 1.246257, step = 146420 (8.035 sec)
INFO:tensorflow:lr = 9.182601e-05 (8.034 sec)
INFO:tensorflow:global_step/sec: 12.6804
INFO:tensorflow:loss = 1.2494022, step = 146520 (7.884 sec)
INFO:tensorflow:lr = 9.173378e-05 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.6978
INFO:tensorflow:loss = 1.2443601, step = 146620 (7.877 sec)
INFO:tensorflow:lr = 9.164162e-05 (7.877 sec)
INFO:tensorflow:Saving checkpoints for 146700 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2431201.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-146700
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-146700
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.724
INFO:tensorflow:Best (Exact Match) Accuracy: 0.724
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-146700
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 146700 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2443894, step = 146700
INFO:tensorflow:lr = 9.156797e-05
INFO:tensorflow:global_step/sec: 10.051
INFO:tensorflow:loss = 1.244071, step = 146800 (9.952 sec)
INFO:tensorflow:lr = 9.1475995e-05 (9.956 sec)
INFO:tensorflow:global_step/sec: 12.6786
INFO:tensorflow:loss = 1.255505, step = 146900 (7.891 sec)
INFO:tensorflow:lr = 9.138411e-05 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.6207
INFO:tensorflow:loss = 1.2456456, step = 147000 (7.924 sec)
INFO:tensorflow:lr = 9.129231e-05 (7.924 sec)
INFO:tensorflow:global_step/sec: 12.7906
INFO:tensorflow:loss = 1.2438047, step = 147100 (7.815 sec)
INFO:tensorflow:lr = 9.12006e-05 (7.816 sec)
INFO:tensorflow:global_step/sec: 12.5422
INFO:tensorflow:loss = 1.2472233, step = 147200 (7.972 sec)
INFO:tensorflow:lr = 9.1108974e-05 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.6121
INFO:tensorflow:loss = 1.2505473, step = 147300 (7.928 sec)
INFO:tensorflow:lr = 9.101747e-05 (7.928 sec)
INFO:tensorflow:global_step/sec: 12.5697
INFO:tensorflow:loss = 1.245287, step = 147400 (7.956 sec)
INFO:tensorflow:lr = 9.092603e-05 (7.963 sec)
INFO:tensorflow:global_step/sec: 12.6833
INFO:tensorflow:loss = 1.2446585, step = 147500 (7.886 sec)
INFO:tensorflow:lr = 9.08347e-05 (7.880 sec)
INFO:tensorflow:global_step/sec: 12.8006
INFO:tensorflow:loss = 1.2419182, step = 147600 (7.811 sec)
INFO:tensorflow:lr = 9.0743444e-05 (7.811 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.31527
INFO:tensorflow:loss = 1.2440436, step = 147700 (12.030 sec)
INFO:tensorflow:lr = 9.065229e-05 (12.028 sec)
INFO:tensorflow:global_step/sec: 12.5065
INFO:tensorflow:loss = 1.2445109, step = 147800 (7.991 sec)
INFO:tensorflow:lr = 9.056123e-05 (7.991 sec)
INFO:tensorflow:global_step/sec: 12.7083
INFO:tensorflow:loss = 1.2437775, step = 147900 (7.869 sec)
INFO:tensorflow:lr = 9.047026e-05 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.5151
INFO:tensorflow:loss = 1.247248, step = 148000 (7.991 sec)
INFO:tensorflow:lr = 9.0379384e-05 (7.992 sec)
INFO:tensorflow:global_step/sec: 12.2781
INFO:tensorflow:loss = 1.244056, step = 148100 (8.146 sec)
INFO:tensorflow:lr = 9.028859e-05 (8.147 sec)
INFO:tensorflow:global_step/sec: 12.6575
INFO:tensorflow:loss = 1.2453225, step = 148200 (7.899 sec)
INFO:tensorflow:lr = 9.019789e-05 (7.897 sec)
INFO:tensorflow:global_step/sec: 12.6457
INFO:tensorflow:loss = 1.2532479, step = 148300 (7.917 sec)
INFO:tensorflow:lr = 9.010729e-05 (7.918 sec)
INFO:tensorflow:global_step/sec: 12.6258
INFO:tensorflow:loss = 1.2450638, step = 148400 (7.911 sec)
INFO:tensorflow:lr = 9.001677e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.4214
INFO:tensorflow:loss = 1.2449104, step = 148500 (8.051 sec)
INFO:tensorflow:lr = 8.9926354e-05 (8.050 sec)
INFO:tensorflow:global_step/sec: 12.9721
INFO:tensorflow:loss = 1.2434419, step = 148600 (7.709 sec)
INFO:tensorflow:lr = 8.9836016e-05 (7.717 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.28238
INFO:tensorflow:loss = 1.2493786, step = 148700 (12.079 sec)
INFO:tensorflow:lr = 8.9745765e-05 (12.071 sec)
INFO:tensorflow:global_step/sec: 12.7538
INFO:tensorflow:loss = 1.2464718, step = 148800 (7.841 sec)
INFO:tensorflow:lr = 8.9655616e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.9883
INFO:tensorflow:loss = 1.2417631, step = 148900 (7.699 sec)
INFO:tensorflow:lr = 8.9565554e-05 (7.699 sec)
INFO:tensorflow:global_step/sec: 12.7568
INFO:tensorflow:loss = 1.2475207, step = 149000 (7.839 sec)
INFO:tensorflow:lr = 8.9475594e-05 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.7225
INFO:tensorflow:loss = 1.245023, step = 149100 (7.860 sec)
INFO:tensorflow:lr = 8.938571e-05 (7.860 sec)
INFO:tensorflow:global_step/sec: 12.4462
INFO:tensorflow:loss = 1.245929, step = 149200 (8.034 sec)
INFO:tensorflow:lr = 8.9295914e-05 (8.034 sec)
INFO:tensorflow:global_step/sec: 12.679
INFO:tensorflow:loss = 1.2436159, step = 149300 (7.886 sec)
INFO:tensorflow:lr = 8.920622e-05 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.6329
INFO:tensorflow:loss = 1.2462329, step = 149400 (7.917 sec)
INFO:tensorflow:lr = 8.91166e-05 (7.917 sec)
INFO:tensorflow:global_step/sec: 12.5809
INFO:tensorflow:loss = 1.2441921, step = 149500 (7.948 sec)
INFO:tensorflow:lr = 8.902709e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 12.7485
INFO:tensorflow:loss = 1.2438712, step = 149600 (7.840 sec)
INFO:tensorflow:lr = 8.893766e-05 (7.840 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.29717
INFO:tensorflow:loss = 1.2439181, step = 149700 (12.053 sec)
INFO:tensorflow:lr = 8.884831e-05 (12.054 sec)
INFO:tensorflow:global_step/sec: 12.469
INFO:tensorflow:loss = 1.2439133, step = 149800 (8.019 sec)
INFO:tensorflow:lr = 8.8759065e-05 (8.019 sec)
INFO:tensorflow:global_step/sec: 12.5088
INFO:tensorflow:loss = 1.243963, step = 149900 (7.994 sec)
INFO:tensorflow:lr = 8.86699e-05 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.9688
INFO:tensorflow:loss = 1.2440338, step = 150000 (7.711 sec)
INFO:tensorflow:lr = 8.858084e-05 (7.711 sec)
INFO:tensorflow:global_step/sec: 12.8106
INFO:tensorflow:loss = 1.2429388, step = 150100 (7.806 sec)
INFO:tensorflow:lr = 8.849185e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.6214
INFO:tensorflow:loss = 1.2436142, step = 150200 (7.924 sec)
INFO:tensorflow:lr = 8.840295e-05 (7.923 sec)
INFO:tensorflow:global_step/sec: 12.281
INFO:tensorflow:loss = 1.2437512, step = 150300 (8.143 sec)
INFO:tensorflow:lr = 8.8314155e-05 (8.142 sec)
INFO:tensorflow:global_step/sec: 13.0256
INFO:tensorflow:loss = 1.2468607, step = 150400 (7.680 sec)
INFO:tensorflow:lr = 8.822544e-05 (7.681 sec)
INFO:tensorflow:global_step/sec: 12.1457
INFO:tensorflow:loss = 1.2475142, step = 150500 (8.236 sec)
INFO:tensorflow:lr = 8.8136825e-05 (8.236 sec)
INFO:tensorflow:global_step/sec: 12.1629
INFO:tensorflow:loss = 1.2439152, step = 150600 (8.227 sec)
INFO:tensorflow:lr = 8.8048284e-05 (8.227 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.27788
INFO:tensorflow:loss = 1.2460039, step = 150700 (12.070 sec)
INFO:tensorflow:lr = 8.795983e-05 (12.071 sec)
INFO:tensorflow:global_step/sec: 12.1396
INFO:tensorflow:loss = 1.244453, step = 150800 (8.235 sec)
INFO:tensorflow:lr = 8.7871485e-05 (8.236 sec)
INFO:tensorflow:global_step/sec: 12.3241
INFO:tensorflow:loss = 1.2413253, step = 150900 (8.114 sec)
INFO:tensorflow:lr = 8.7783206e-05 (8.113 sec)
INFO:tensorflow:global_step/sec: 12.7433
INFO:tensorflow:loss = 1.2435942, step = 151000 (7.848 sec)
INFO:tensorflow:lr = 8.769503e-05 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.4367
INFO:tensorflow:loss = 1.2434167, step = 151100 (8.047 sec)
INFO:tensorflow:lr = 8.760694e-05 (8.048 sec)
INFO:tensorflow:global_step/sec: 12.1844
INFO:tensorflow:loss = 1.2427095, step = 151200 (8.200 sec)
INFO:tensorflow:lr = 8.751893e-05 (8.202 sec)
INFO:tensorflow:global_step/sec: 12.4128
INFO:tensorflow:loss = 1.2415925, step = 151300 (8.060 sec)
INFO:tensorflow:lr = 8.743102e-05 (8.057 sec)
INFO:tensorflow:global_step/sec: 12.3837
INFO:tensorflow:loss = 1.2425196, step = 151400 (8.078 sec)
INFO:tensorflow:lr = 8.7343185e-05 (8.078 sec)
INFO:tensorflow:global_step/sec: 12.7142
INFO:tensorflow:loss = 1.2500411, step = 151500 (7.865 sec)
INFO:tensorflow:lr = 8.725546e-05 (7.866 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.63353
INFO:tensorflow:loss = 1.2459517, step = 151600 (11.579 sec)
INFO:tensorflow:lr = 8.71678e-05 (11.582 sec)
INFO:tensorflow:global_step/sec: 12.2656
INFO:tensorflow:loss = 1.2423538, step = 151700 (8.149 sec)
INFO:tensorflow:lr = 8.708024e-05 (8.147 sec)
INFO:tensorflow:global_step/sec: 12.6121
INFO:tensorflow:loss = 1.2505404, step = 151800 (7.934 sec)
INFO:tensorflow:lr = 8.699277e-05 (7.934 sec)
INFO:tensorflow:global_step/sec: 12.7894
INFO:tensorflow:loss = 1.2456331, step = 151900 (7.814 sec)
INFO:tensorflow:lr = 8.690538e-05 (7.813 sec)
INFO:tensorflow:global_step/sec: 12.5493
INFO:tensorflow:loss = 1.246384, step = 152000 (7.971 sec)
INFO:tensorflow:lr = 8.681809e-05 (7.973 sec)
INFO:tensorflow:global_step/sec: 12.3397
INFO:tensorflow:loss = 1.2433354, step = 152100 (8.101 sec)
INFO:tensorflow:lr = 8.673086e-05 (8.100 sec)
INFO:tensorflow:global_step/sec: 12.3386
INFO:tensorflow:loss = 1.2442598, step = 152200 (8.106 sec)
INFO:tensorflow:lr = 8.664373e-05 (8.106 sec)
INFO:tensorflow:global_step/sec: 12.7453
INFO:tensorflow:loss = 1.2427703, step = 152300 (7.844 sec)
INFO:tensorflow:lr = 8.655672e-05 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.9112
INFO:tensorflow:loss = 1.2528266, step = 152400 (7.746 sec)
INFO:tensorflow:lr = 8.6469765e-05 (7.744 sec)
INFO:tensorflow:global_step/sec: 12.8283
INFO:tensorflow:loss = 1.2462392, step = 152500 (7.801 sec)
INFO:tensorflow:lr = 8.6382905e-05 (7.800 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.06405
INFO:tensorflow:loss = 1.2444615, step = 152600 (11.031 sec)
INFO:tensorflow:lr = 8.6296124e-05 (11.031 sec)
INFO:tensorflow:global_step/sec: 13.1834
INFO:tensorflow:loss = 1.2434341, step = 152700 (7.585 sec)
INFO:tensorflow:lr = 8.6209424e-05 (7.585 sec)
INFO:tensorflow:global_step/sec: 12.618
INFO:tensorflow:loss = 1.2439532, step = 152800 (7.920 sec)
INFO:tensorflow:lr = 8.612283e-05 (7.921 sec)
INFO:tensorflow:global_step/sec: 12.5351
INFO:tensorflow:loss = 1.2488467, step = 152900 (7.978 sec)
INFO:tensorflow:lr = 8.6036314e-05 (7.978 sec)
INFO:tensorflow:global_step/sec: 12.4584
INFO:tensorflow:loss = 1.2502102, step = 153000 (8.026 sec)
INFO:tensorflow:lr = 8.59499e-05 (8.026 sec)
INFO:tensorflow:global_step/sec: 12.8334
INFO:tensorflow:loss = 1.2436447, step = 153100 (7.795 sec)
INFO:tensorflow:lr = 8.586356e-05 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.9761
INFO:tensorflow:loss = 1.2446896, step = 153200 (7.709 sec)
INFO:tensorflow:lr = 8.5777305e-05 (7.707 sec)
INFO:tensorflow:global_step/sec: 12.5871
INFO:tensorflow:loss = 1.2448373, step = 153300 (7.939 sec)
INFO:tensorflow:lr = 8.569114e-05 (7.939 sec)
INFO:tensorflow:global_step/sec: 12.3519
INFO:tensorflow:loss = 1.24809, step = 153400 (8.097 sec)
INFO:tensorflow:lr = 8.560506e-05 (8.101 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1207
INFO:tensorflow:loss = 1.243688, step = 153500 (8.260 sec)
INFO:tensorflow:lr = 8.5519074e-05 (8.259 sec)
INFO:tensorflow:global_step/sec: 10.5819
INFO:tensorflow:loss = 1.2423753, step = 153600 (9.445 sec)
INFO:tensorflow:lr = 8.543317e-05 (9.445 sec)
INFO:tensorflow:global_step/sec: 12.5556
INFO:tensorflow:loss = 1.2469901, step = 153700 (7.965 sec)
INFO:tensorflow:lr = 8.534733e-05 (7.963 sec)
INFO:tensorflow:global_step/sec: 12.8293
INFO:tensorflow:loss = 1.2434926, step = 153800 (7.793 sec)
INFO:tensorflow:lr = 8.5261614e-05 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.517
INFO:tensorflow:loss = 1.2455355, step = 153900 (7.987 sec)
INFO:tensorflow:lr = 8.517596e-05 (7.987 sec)
INFO:tensorflow:global_step/sec: 12.5719
INFO:tensorflow:loss = 1.2419705, step = 154000 (7.952 sec)
INFO:tensorflow:lr = 8.50904e-05 (7.954 sec)
INFO:tensorflow:global_step/sec: 12.5582
INFO:tensorflow:loss = 1.2438302, step = 154100 (7.966 sec)
INFO:tensorflow:lr = 8.500492e-05 (7.964 sec)
INFO:tensorflow:global_step/sec: 12.7461
INFO:tensorflow:loss = 1.2498709, step = 154200 (7.842 sec)
INFO:tensorflow:lr = 8.491953e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.4289
INFO:tensorflow:loss = 1.2408761, step = 154300 (8.048 sec)
INFO:tensorflow:lr = 8.483423e-05 (8.048 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.6554
INFO:tensorflow:loss = 1.2410917, step = 154400 (7.906 sec)
INFO:tensorflow:lr = 8.474901e-05 (7.906 sec)
INFO:tensorflow:global_step/sec: 10.9855
INFO:tensorflow:loss = 1.2470044, step = 154500 (9.102 sec)
INFO:tensorflow:lr = 8.466389e-05 (9.103 sec)
INFO:tensorflow:global_step/sec: 12.8813
INFO:tensorflow:loss = 1.2450987, step = 154600 (7.757 sec)
INFO:tensorflow:lr = 8.457883e-05 (7.757 sec)
INFO:tensorflow:global_step/sec: 12.3704
INFO:tensorflow:loss = 1.243781, step = 154700 (8.091 sec)
INFO:tensorflow:lr = 8.449386e-05 (8.096 sec)
INFO:tensorflow:global_step/sec: 12.8307
INFO:tensorflow:loss = 1.2424403, step = 154800 (7.790 sec)
INFO:tensorflow:lr = 8.440899e-05 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.7739
INFO:tensorflow:loss = 1.2446392, step = 154900 (7.831 sec)
INFO:tensorflow:lr = 8.43242e-05 (7.829 sec)
INFO:tensorflow:global_step/sec: 12.4939
INFO:tensorflow:loss = 1.2413216, step = 155000 (7.998 sec)
INFO:tensorflow:lr = 8.42395e-05 (8.005 sec)
INFO:tensorflow:global_step/sec: 12.6264
INFO:tensorflow:loss = 1.2452991, step = 155100 (7.920 sec)
INFO:tensorflow:lr = 8.4154875e-05 (7.921 sec)
INFO:tensorflow:global_step/sec: 12.6364
INFO:tensorflow:loss = 1.2444293, step = 155200 (7.916 sec)
INFO:tensorflow:lr = 8.4070336e-05 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.6398
INFO:tensorflow:loss = 1.2430124, step = 155300 (7.916 sec)
INFO:tensorflow:lr = 8.398589e-05 (7.913 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0453
INFO:tensorflow:loss = 1.2424821, step = 155400 (8.309 sec)
INFO:tensorflow:lr = 8.390151e-05 (8.317 sec)
INFO:tensorflow:global_step/sec: 11.2988
INFO:tensorflow:loss = 1.2471951, step = 155500 (8.845 sec)
INFO:tensorflow:lr = 8.381725e-05 (8.837 sec)
INFO:tensorflow:global_step/sec: 12.8677
INFO:tensorflow:loss = 1.2544374, step = 155600 (7.768 sec)
INFO:tensorflow:lr = 8.3733044e-05 (7.768 sec)
INFO:tensorflow:global_step/sec: 12.6591
INFO:tensorflow:loss = 1.2498583, step = 155700 (7.899 sec)
INFO:tensorflow:lr = 8.364893e-05 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.7241
INFO:tensorflow:loss = 1.2448832, step = 155800 (7.859 sec)
INFO:tensorflow:lr = 8.3564904e-05 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.6629
INFO:tensorflow:loss = 1.244978, step = 155900 (7.894 sec)
INFO:tensorflow:lr = 8.348096e-05 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.6465
INFO:tensorflow:loss = 1.2439777, step = 156000 (7.908 sec)
INFO:tensorflow:lr = 8.3397106e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 11.9459
INFO:tensorflow:loss = 1.2434794, step = 156100 (8.375 sec)
INFO:tensorflow:lr = 8.331332e-05 (8.374 sec)
INFO:tensorflow:global_step/sec: 12.5495
INFO:tensorflow:loss = 1.2426113, step = 156200 (7.969 sec)
INFO:tensorflow:lr = 8.322963e-05 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.7922
INFO:tensorflow:loss = 1.2448606, step = 156300 (7.814 sec)
INFO:tensorflow:lr = 8.3146035e-05 (7.814 sec)
INFO:tensorflow:global_step/sec: 13.0554
INFO:tensorflow:loss = 1.2424155, step = 156400 (7.660 sec)
INFO:tensorflow:lr = 8.306251e-05 (7.660 sec)
INFO:tensorflow:Saving checkpoints for 156480 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2409595.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-156480
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-156480
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.731
INFO:tensorflow:Best (Exact Match) Accuracy: 0.731
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-156480
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 156480 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2545527, step = 156480
INFO:tensorflow:lr = 8.299575e-05
INFO:tensorflow:global_step/sec: 10.0548
INFO:tensorflow:loss = 1.2425964, step = 156580 (9.952 sec)
INFO:tensorflow:lr = 8.291238e-05 (9.953 sec)
INFO:tensorflow:global_step/sec: 12.7802
INFO:tensorflow:loss = 1.243327, step = 156680 (7.821 sec)
INFO:tensorflow:lr = 8.282909e-05 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.544
INFO:tensorflow:loss = 1.2435379, step = 156780 (7.972 sec)
INFO:tensorflow:lr = 8.2745886e-05 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.7211
INFO:tensorflow:loss = 1.2486848, step = 156880 (7.867 sec)
INFO:tensorflow:lr = 8.266277e-05 (7.867 sec)
INFO:tensorflow:global_step/sec: 13.0432
INFO:tensorflow:loss = 1.2423004, step = 156980 (7.664 sec)
INFO:tensorflow:lr = 8.2579725e-05 (7.663 sec)
INFO:tensorflow:global_step/sec: 12.7176
INFO:tensorflow:loss = 1.2446653, step = 157080 (7.861 sec)
INFO:tensorflow:lr = 8.249678e-05 (7.862 sec)
INFO:tensorflow:global_step/sec: 12.6615
INFO:tensorflow:loss = 1.2431146, step = 157180 (7.901 sec)
INFO:tensorflow:lr = 8.2413906e-05 (7.900 sec)
INFO:tensorflow:global_step/sec: 12.6109
INFO:tensorflow:loss = 1.2475405, step = 157280 (7.930 sec)
INFO:tensorflow:lr = 8.233111e-05 (7.930 sec)
INFO:tensorflow:global_step/sec: 12.9061
INFO:tensorflow:loss = 1.2426296, step = 157380 (7.748 sec)
INFO:tensorflow:lr = 8.2248414e-05 (7.748 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.17322
INFO:tensorflow:loss = 1.2472751, step = 157480 (12.237 sec)
INFO:tensorflow:lr = 8.2165796e-05 (12.237 sec)
INFO:tensorflow:global_step/sec: 12.8058
INFO:tensorflow:loss = 1.2430243, step = 157580 (7.808 sec)
INFO:tensorflow:lr = 8.208326e-05 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.7737
INFO:tensorflow:loss = 1.2482195, step = 157680 (7.823 sec)
INFO:tensorflow:lr = 8.20008e-05 (7.826 sec)
INFO:tensorflow:global_step/sec: 12.731
INFO:tensorflow:loss = 1.2453948, step = 157780 (7.857 sec)
INFO:tensorflow:lr = 8.191841e-05 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.7219
INFO:tensorflow:loss = 1.2427235, step = 157880 (7.866 sec)
INFO:tensorflow:lr = 8.183614e-05 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.5526
INFO:tensorflow:loss = 1.2457312, step = 157980 (7.964 sec)
INFO:tensorflow:lr = 8.1753926e-05 (7.964 sec)
INFO:tensorflow:global_step/sec: 12.6871
INFO:tensorflow:loss = 1.2447507, step = 158080 (7.878 sec)
INFO:tensorflow:lr = 8.167181e-05 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.585
INFO:tensorflow:loss = 1.2416404, step = 158180 (7.946 sec)
INFO:tensorflow:lr = 8.1589766e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 12.7264
INFO:tensorflow:loss = 1.2412192, step = 158280 (7.863 sec)
INFO:tensorflow:lr = 8.15078e-05 (7.861 sec)
INFO:tensorflow:global_step/sec: 12.7235
INFO:tensorflow:loss = 1.2459588, step = 158380 (7.854 sec)
INFO:tensorflow:lr = 8.142593e-05 (7.854 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.34295
INFO:tensorflow:loss = 1.2420511, step = 158480 (11.987 sec)
INFO:tensorflow:lr = 8.134413e-05 (11.986 sec)
INFO:tensorflow:global_step/sec: 12.714
INFO:tensorflow:loss = 1.2457771, step = 158580 (7.865 sec)
INFO:tensorflow:lr = 8.126243e-05 (7.864 sec)
INFO:tensorflow:global_step/sec: 12.6987
INFO:tensorflow:loss = 1.2400635, step = 158680 (7.875 sec)
INFO:tensorflow:lr = 8.11808e-05 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.8282
INFO:tensorflow:loss = 1.2438774, step = 158780 (7.796 sec)
INFO:tensorflow:lr = 8.109924e-05 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.8694
INFO:tensorflow:loss = 1.2427423, step = 158880 (7.770 sec)
INFO:tensorflow:lr = 8.101778e-05 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.6658
INFO:tensorflow:loss = 1.241447, step = 158980 (7.896 sec)
INFO:tensorflow:lr = 8.093639e-05 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.5078
INFO:tensorflow:loss = 1.2422627, step = 159080 (7.998 sec)
INFO:tensorflow:lr = 8.08551e-05 (8.001 sec)
INFO:tensorflow:global_step/sec: 12.6664
INFO:tensorflow:loss = 1.250941, step = 159180 (7.897 sec)
INFO:tensorflow:lr = 8.077386e-05 (7.900 sec)
INFO:tensorflow:global_step/sec: 12.7541
INFO:tensorflow:loss = 1.2464032, step = 159280 (7.841 sec)
INFO:tensorflow:lr = 8.069272e-05 (7.836 sec)
INFO:tensorflow:global_step/sec: 12.7697
INFO:tensorflow:loss = 1.2432774, step = 159380 (7.831 sec)
INFO:tensorflow:lr = 8.0611666e-05 (7.831 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.30956
INFO:tensorflow:loss = 1.245586, step = 159480 (12.031 sec)
INFO:tensorflow:lr = 8.053069e-05 (12.032 sec)
INFO:tensorflow:global_step/sec: 12.7577
INFO:tensorflow:loss = 1.2436898, step = 159580 (7.840 sec)
INFO:tensorflow:lr = 8.0449805e-05 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.6921
INFO:tensorflow:loss = 1.2427038, step = 159680 (7.880 sec)
INFO:tensorflow:lr = 8.036898e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.5858
INFO:tensorflow:loss = 1.2463199, step = 159780 (7.940 sec)
INFO:tensorflow:lr = 8.028825e-05 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.9176
INFO:tensorflow:loss = 1.2422549, step = 159880 (7.743 sec)
INFO:tensorflow:lr = 8.02076e-05 (7.746 sec)
INFO:tensorflow:global_step/sec: 12.7488
INFO:tensorflow:loss = 1.2433963, step = 159980 (7.847 sec)
INFO:tensorflow:lr = 8.0127036e-05 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.8153
INFO:tensorflow:loss = 1.2405639, step = 160080 (7.804 sec)
INFO:tensorflow:lr = 8.004654e-05 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.7982
INFO:tensorflow:loss = 1.2429812, step = 160180 (7.810 sec)
INFO:tensorflow:lr = 7.996613e-05 (7.810 sec)
INFO:tensorflow:global_step/sec: 12.5992
INFO:tensorflow:loss = 1.2426969, step = 160280 (7.935 sec)
INFO:tensorflow:lr = 7.9885795e-05 (7.935 sec)
INFO:tensorflow:global_step/sec: 12.6284
INFO:tensorflow:loss = 1.2485273, step = 160380 (7.924 sec)
INFO:tensorflow:lr = 7.9805555e-05 (7.924 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.43014
INFO:tensorflow:loss = 1.2451617, step = 160480 (11.859 sec)
INFO:tensorflow:lr = 7.972538e-05 (11.859 sec)
INFO:tensorflow:global_step/sec: 12.8098
INFO:tensorflow:loss = 1.2438232, step = 160580 (7.804 sec)
INFO:tensorflow:lr = 7.9645295e-05 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.8416
INFO:tensorflow:loss = 1.2421925, step = 160680 (7.787 sec)
INFO:tensorflow:lr = 7.9565296e-05 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.8333
INFO:tensorflow:loss = 1.2429509, step = 160780 (7.792 sec)
INFO:tensorflow:lr = 7.948537e-05 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.7757
INFO:tensorflow:loss = 1.2418758, step = 160880 (7.828 sec)
INFO:tensorflow:lr = 7.940552e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.6713
INFO:tensorflow:loss = 1.2432858, step = 160980 (7.896 sec)
INFO:tensorflow:lr = 7.9325764e-05 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.5948
INFO:tensorflow:loss = 1.24457, step = 161080 (7.943 sec)
INFO:tensorflow:lr = 7.9246085e-05 (7.944 sec)
INFO:tensorflow:global_step/sec: 12.7125
INFO:tensorflow:loss = 1.2471696, step = 161180 (7.864 sec)
INFO:tensorflow:lr = 7.916647e-05 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.8499
INFO:tensorflow:loss = 1.2433884, step = 161280 (7.782 sec)
INFO:tensorflow:lr = 7.9086945e-05 (7.782 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.62131
INFO:tensorflow:loss = 1.2433494, step = 161380 (11.599 sec)
INFO:tensorflow:lr = 7.900751e-05 (11.598 sec)
INFO:tensorflow:global_step/sec: 12.575
INFO:tensorflow:loss = 1.2430332, step = 161480 (7.952 sec)
INFO:tensorflow:lr = 7.892813e-05 (7.952 sec)
INFO:tensorflow:global_step/sec: 12.7951
INFO:tensorflow:loss = 1.2427179, step = 161580 (7.815 sec)
INFO:tensorflow:lr = 7.884885e-05 (7.815 sec)
INFO:tensorflow:global_step/sec: 12.7562
INFO:tensorflow:loss = 1.2430513, step = 161680 (7.841 sec)
INFO:tensorflow:lr = 7.876965e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.3947
INFO:tensorflow:loss = 1.2428813, step = 161780 (8.065 sec)
INFO:tensorflow:lr = 7.8690515e-05 (8.064 sec)
INFO:tensorflow:global_step/sec: 12.5447
INFO:tensorflow:loss = 1.2428411, step = 161880 (7.968 sec)
INFO:tensorflow:lr = 7.8611476e-05 (7.969 sec)
INFO:tensorflow:global_step/sec: 12.5711
INFO:tensorflow:loss = 1.2425469, step = 161980 (7.958 sec)
INFO:tensorflow:lr = 7.8532496e-05 (7.958 sec)
INFO:tensorflow:global_step/sec: 12.9131
INFO:tensorflow:loss = 1.2412182, step = 162080 (7.746 sec)
INFO:tensorflow:lr = 7.845362e-05 (7.746 sec)
INFO:tensorflow:global_step/sec: 12.4472
INFO:tensorflow:loss = 1.2435589, step = 162180 (8.033 sec)
INFO:tensorflow:lr = 7.8374804e-05 (8.034 sec)
INFO:tensorflow:global_step/sec: 12.8406
INFO:tensorflow:loss = 1.2414767, step = 162280 (7.783 sec)
INFO:tensorflow:lr = 7.829606e-05 (7.784 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.14022
INFO:tensorflow:loss = 1.242339, step = 162380 (10.944 sec)
INFO:tensorflow:lr = 7.8217425e-05 (10.944 sec)
INFO:tensorflow:global_step/sec: 12.7715
INFO:tensorflow:loss = 1.2425467, step = 162480 (7.827 sec)
INFO:tensorflow:lr = 7.8138844e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.3174
INFO:tensorflow:loss = 1.2458082, step = 162580 (8.123 sec)
INFO:tensorflow:lr = 7.8060366e-05 (8.122 sec)
INFO:tensorflow:global_step/sec: 12.43
INFO:tensorflow:loss = 1.2450854, step = 162680 (8.040 sec)
INFO:tensorflow:lr = 7.7981946e-05 (8.040 sec)
INFO:tensorflow:global_step/sec: 12.8185
INFO:tensorflow:loss = 1.2413714, step = 162780 (7.808 sec)
INFO:tensorflow:lr = 7.7903605e-05 (7.808 sec)
INFO:tensorflow:global_step/sec: 12.8459
INFO:tensorflow:loss = 1.2418839, step = 162880 (7.782 sec)
INFO:tensorflow:lr = 7.782536e-05 (7.782 sec)
INFO:tensorflow:global_step/sec: 12.6585
INFO:tensorflow:loss = 1.2452873, step = 162980 (7.896 sec)
INFO:tensorflow:lr = 7.774718e-05 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.9969
INFO:tensorflow:loss = 1.2421685, step = 163080 (7.699 sec)
INFO:tensorflow:lr = 7.766908e-05 (7.698 sec)
INFO:tensorflow:global_step/sec: 12.4813
INFO:tensorflow:loss = 1.2429278, step = 163180 (8.012 sec)
INFO:tensorflow:lr = 7.759106e-05 (8.012 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2018
INFO:tensorflow:loss = 1.2407615, step = 163280 (8.198 sec)
INFO:tensorflow:lr = 7.751311e-05 (8.200 sec)
INFO:tensorflow:global_step/sec: 10.6203
INFO:tensorflow:loss = 1.2463655, step = 163380 (9.414 sec)
INFO:tensorflow:lr = 7.743525e-05 (9.412 sec)
INFO:tensorflow:global_step/sec: 12.751
INFO:tensorflow:loss = 1.2475263, step = 163480 (7.838 sec)
INFO:tensorflow:lr = 7.7357465e-05 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.8988
INFO:tensorflow:loss = 1.2489913, step = 163580 (7.759 sec)
INFO:tensorflow:lr = 7.7279765e-05 (7.758 sec)
INFO:tensorflow:global_step/sec: 12.7432
INFO:tensorflow:loss = 1.246935, step = 163680 (7.840 sec)
INFO:tensorflow:lr = 7.720213e-05 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.7445
INFO:tensorflow:loss = 1.2567366, step = 163780 (7.846 sec)
INFO:tensorflow:lr = 7.7124576e-05 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.6891
INFO:tensorflow:loss = 1.2523156, step = 163880 (7.886 sec)
INFO:tensorflow:lr = 7.704711e-05 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.5144
INFO:tensorflow:loss = 1.2429801, step = 163980 (7.989 sec)
INFO:tensorflow:lr = 7.696971e-05 (7.989 sec)
INFO:tensorflow:global_step/sec: 12.7412
INFO:tensorflow:loss = 1.2436205, step = 164080 (7.852 sec)
INFO:tensorflow:lr = 7.689239e-05 (7.851 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.3508
INFO:tensorflow:loss = 1.2439187, step = 164180 (8.093 sec)
INFO:tensorflow:lr = 7.681516e-05 (8.093 sec)
INFO:tensorflow:global_step/sec: 10.8155
INFO:tensorflow:loss = 1.2418324, step = 164280 (9.247 sec)
INFO:tensorflow:lr = 7.673798e-05 (9.246 sec)
INFO:tensorflow:global_step/sec: 12.8791
INFO:tensorflow:loss = 1.2434556, step = 164380 (7.769 sec)
INFO:tensorflow:lr = 7.66609e-05 (7.770 sec)
INFO:tensorflow:global_step/sec: 12.7672
INFO:tensorflow:loss = 1.2411584, step = 164480 (7.824 sec)
INFO:tensorflow:lr = 7.658389e-05 (7.826 sec)
INFO:tensorflow:global_step/sec: 12.8412
INFO:tensorflow:loss = 1.243303, step = 164580 (7.787 sec)
INFO:tensorflow:lr = 7.650696e-05 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.6858
INFO:tensorflow:loss = 1.243237, step = 164680 (7.883 sec)
INFO:tensorflow:lr = 7.643011e-05 (7.882 sec)
INFO:tensorflow:global_step/sec: 12.7993
INFO:tensorflow:loss = 1.2468959, step = 164780 (7.819 sec)
INFO:tensorflow:lr = 7.6353324e-05 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.9195
INFO:tensorflow:loss = 1.2466041, step = 164880 (7.735 sec)
INFO:tensorflow:lr = 7.627664e-05 (7.735 sec)
INFO:tensorflow:global_step/sec: 12.6698
INFO:tensorflow:loss = 1.2453058, step = 164980 (7.897 sec)
INFO:tensorflow:lr = 7.6200005e-05 (7.896 sec)
INFO:tensorflow:global_step/sec: 12.608
INFO:tensorflow:loss = 1.2435452, step = 165080 (7.932 sec)
INFO:tensorflow:lr = 7.612347e-05 (7.932 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.9524
INFO:tensorflow:loss = 1.2424791, step = 165180 (8.366 sec)
INFO:tensorflow:lr = 7.604699e-05 (8.367 sec)
INFO:tensorflow:global_step/sec: 11.3109
INFO:tensorflow:loss = 1.2438216, step = 165280 (8.836 sec)
INFO:tensorflow:lr = 7.597061e-05 (8.835 sec)
INFO:tensorflow:global_step/sec: 13.0587
INFO:tensorflow:loss = 1.2450823, step = 165380 (7.660 sec)
INFO:tensorflow:lr = 7.58943e-05 (7.662 sec)
INFO:tensorflow:global_step/sec: 12.7891
INFO:tensorflow:loss = 1.2420415, step = 165480 (7.818 sec)
INFO:tensorflow:lr = 7.5818054e-05 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.3887
INFO:tensorflow:loss = 1.2473958, step = 165580 (8.077 sec)
INFO:tensorflow:lr = 7.574189e-05 (8.072 sec)
INFO:tensorflow:global_step/sec: 12.3917
INFO:tensorflow:loss = 1.2471696, step = 165680 (8.069 sec)
INFO:tensorflow:lr = 7.566581e-05 (8.070 sec)
INFO:tensorflow:global_step/sec: 12.9346
INFO:tensorflow:loss = 1.2463306, step = 165780 (7.729 sec)
INFO:tensorflow:lr = 7.558979e-05 (7.728 sec)
INFO:tensorflow:global_step/sec: 12.6382
INFO:tensorflow:loss = 1.2409977, step = 165880 (7.917 sec)
INFO:tensorflow:lr = 7.551387e-05 (7.916 sec)
INFO:tensorflow:global_step/sec: 12.874
INFO:tensorflow:loss = 1.2447242, step = 165980 (7.764 sec)
INFO:tensorflow:lr = 7.5438e-05 (7.765 sec)
INFO:tensorflow:global_step/sec: 12.5758
INFO:tensorflow:loss = 1.2421839, step = 166080 (7.948 sec)
INFO:tensorflow:lr = 7.536224e-05 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.8224
INFO:tensorflow:loss = 1.2433058, step = 166180 (7.799 sec)
INFO:tensorflow:lr = 7.528653e-05 (7.801 sec)
INFO:tensorflow:Saving checkpoints for 166260 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2428299.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-166260
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-166260
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.731
INFO:tensorflow:Best (Exact Match) Accuracy: 0.731
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-166260
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 166260 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2467928, step = 166260
INFO:tensorflow:lr = 7.522602e-05
INFO:tensorflow:global_step/sec: 9.96783
INFO:tensorflow:loss = 1.2433182, step = 166360 (10.039 sec)
INFO:tensorflow:lr = 7.5150456e-05 (10.038 sec)
INFO:tensorflow:global_step/sec: 12.6081
INFO:tensorflow:loss = 1.2423993, step = 166460 (7.930 sec)
INFO:tensorflow:lr = 7.507496e-05 (7.930 sec)
INFO:tensorflow:global_step/sec: 12.9082
INFO:tensorflow:loss = 1.2489258, step = 166560 (7.745 sec)
INFO:tensorflow:lr = 7.499954e-05 (7.745 sec)
INFO:tensorflow:global_step/sec: 12.7743
INFO:tensorflow:loss = 1.2423285, step = 166660 (7.827 sec)
INFO:tensorflow:lr = 7.492421e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.5581
INFO:tensorflow:loss = 1.2450229, step = 166760 (7.962 sec)
INFO:tensorflow:lr = 7.484895e-05 (7.961 sec)
INFO:tensorflow:global_step/sec: 12.8234
INFO:tensorflow:loss = 1.2427442, step = 166860 (7.804 sec)
INFO:tensorflow:lr = 7.4773765e-05 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.8935
INFO:tensorflow:loss = 1.243734, step = 166960 (7.754 sec)
INFO:tensorflow:lr = 7.469865e-05 (7.753 sec)
INFO:tensorflow:global_step/sec: 13.0232
INFO:tensorflow:loss = 1.243697, step = 167060 (7.676 sec)
INFO:tensorflow:lr = 7.4623604e-05 (7.675 sec)
INFO:tensorflow:global_step/sec: 12.8317
INFO:tensorflow:loss = 1.2420083, step = 167160 (7.793 sec)
INFO:tensorflow:lr = 7.454865e-05 (7.794 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.19419
INFO:tensorflow:loss = 1.2424514, step = 167260 (12.208 sec)
INFO:tensorflow:lr = 7.447377e-05 (12.208 sec)
INFO:tensorflow:global_step/sec: 12.8685
INFO:tensorflow:loss = 1.2442771, step = 167360 (7.766 sec)
INFO:tensorflow:lr = 7.4398966e-05 (7.768 sec)
INFO:tensorflow:global_step/sec: 12.7135
INFO:tensorflow:loss = 1.2463063, step = 167460 (7.866 sec)
INFO:tensorflow:lr = 7.432422e-05 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.8504
INFO:tensorflow:loss = 1.2478987, step = 167560 (7.782 sec)
INFO:tensorflow:lr = 7.424955e-05 (7.784 sec)
INFO:tensorflow:global_step/sec: 12.4762
INFO:tensorflow:loss = 1.2463549, step = 167660 (8.017 sec)
INFO:tensorflow:lr = 7.4174975e-05 (8.014 sec)
INFO:tensorflow:global_step/sec: 12.6068
INFO:tensorflow:loss = 1.243028, step = 167760 (7.935 sec)
INFO:tensorflow:lr = 7.4100455e-05 (7.936 sec)
INFO:tensorflow:global_step/sec: 12.7757
INFO:tensorflow:loss = 1.2428224, step = 167860 (7.827 sec)
INFO:tensorflow:lr = 7.402602e-05 (7.827 sec)
INFO:tensorflow:global_step/sec: 12.9328
INFO:tensorflow:loss = 1.2443757, step = 167960 (7.733 sec)
INFO:tensorflow:lr = 7.3951654e-05 (7.732 sec)
INFO:tensorflow:global_step/sec: 12.7784
INFO:tensorflow:loss = 1.242498, step = 168060 (7.827 sec)
INFO:tensorflow:lr = 7.387737e-05 (7.827 sec)
INFO:tensorflow:global_step/sec: 12.7597
INFO:tensorflow:loss = 1.246404, step = 168160 (7.835 sec)
INFO:tensorflow:lr = 7.380317e-05 (7.837 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.28793
INFO:tensorflow:loss = 1.2430749, step = 168260 (12.061 sec)
INFO:tensorflow:lr = 7.3729025e-05 (12.062 sec)
INFO:tensorflow:global_step/sec: 12.7741
INFO:tensorflow:loss = 1.2416666, step = 168360 (7.837 sec)
INFO:tensorflow:lr = 7.365496e-05 (7.835 sec)
INFO:tensorflow:global_step/sec: 12.6338
INFO:tensorflow:loss = 1.2404863, step = 168460 (7.911 sec)
INFO:tensorflow:lr = 7.358097e-05 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.8762
INFO:tensorflow:loss = 1.2460499, step = 168560 (7.765 sec)
INFO:tensorflow:lr = 7.3507064e-05 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.6483
INFO:tensorflow:loss = 1.245742, step = 168660 (7.905 sec)
INFO:tensorflow:lr = 7.343323e-05 (7.904 sec)
INFO:tensorflow:global_step/sec: 12.7735
INFO:tensorflow:loss = 1.2437085, step = 168760 (7.827 sec)
INFO:tensorflow:lr = 7.335946e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.7082
INFO:tensorflow:loss = 1.2422924, step = 168860 (7.873 sec)
INFO:tensorflow:lr = 7.3285766e-05 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.9294
INFO:tensorflow:loss = 1.2445481, step = 168960 (7.737 sec)
INFO:tensorflow:lr = 7.321215e-05 (7.736 sec)
INFO:tensorflow:global_step/sec: 13.0217
INFO:tensorflow:loss = 1.2428153, step = 169060 (7.677 sec)
INFO:tensorflow:lr = 7.3138595e-05 (7.679 sec)
INFO:tensorflow:global_step/sec: 12.4694
INFO:tensorflow:loss = 1.24292, step = 169160 (8.022 sec)
INFO:tensorflow:lr = 7.306513e-05 (8.020 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.20923
INFO:tensorflow:loss = 1.2442397, step = 169260 (12.182 sec)
INFO:tensorflow:lr = 7.299173e-05 (12.182 sec)
INFO:tensorflow:global_step/sec: 12.6733
INFO:tensorflow:loss = 1.2442619, step = 169360 (7.886 sec)
INFO:tensorflow:lr = 7.291842e-05 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.714
INFO:tensorflow:loss = 1.2440118, step = 169460 (7.871 sec)
INFO:tensorflow:lr = 7.284516e-05 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.5632
INFO:tensorflow:loss = 1.2449383, step = 169560 (7.957 sec)
INFO:tensorflow:lr = 7.277198e-05 (7.959 sec)
INFO:tensorflow:global_step/sec: 12.7235
INFO:tensorflow:loss = 1.2519269, step = 169660 (7.862 sec)
INFO:tensorflow:lr = 7.269889e-05 (7.861 sec)
INFO:tensorflow:global_step/sec: 12.8846
INFO:tensorflow:loss = 1.2426889, step = 169760 (7.758 sec)
INFO:tensorflow:lr = 7.262586e-05 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.6476
INFO:tensorflow:loss = 1.2445718, step = 169860 (7.902 sec)
INFO:tensorflow:lr = 7.25529e-05 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.6015
INFO:tensorflow:loss = 1.242896, step = 169960 (7.939 sec)
INFO:tensorflow:lr = 7.248003e-05 (7.941 sec)
INFO:tensorflow:global_step/sec: 12.5507
INFO:tensorflow:loss = 1.2418842, step = 170060 (7.964 sec)
INFO:tensorflow:lr = 7.2407216e-05 (7.962 sec)
INFO:tensorflow:global_step/sec: 13.0502
INFO:tensorflow:loss = 1.2443966, step = 170160 (7.668 sec)
INFO:tensorflow:lr = 7.2334486e-05 (7.668 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.36448
INFO:tensorflow:loss = 1.2439117, step = 170260 (11.952 sec)
INFO:tensorflow:lr = 7.226182e-05 (11.954 sec)
INFO:tensorflow:global_step/sec: 12.879
INFO:tensorflow:loss = 1.2425317, step = 170360 (7.767 sec)
INFO:tensorflow:lr = 7.2189236e-05 (7.764 sec)
INFO:tensorflow:global_step/sec: 13.0269
INFO:tensorflow:loss = 1.243981, step = 170460 (7.677 sec)
INFO:tensorflow:lr = 7.2116716e-05 (7.677 sec)
INFO:tensorflow:global_step/sec: 12.7859
INFO:tensorflow:loss = 1.2428844, step = 170560 (7.824 sec)
INFO:tensorflow:lr = 7.204427e-05 (7.824 sec)
INFO:tensorflow:global_step/sec: 12.6076
INFO:tensorflow:loss = 1.2415282, step = 170660 (7.926 sec)
INFO:tensorflow:lr = 7.19719e-05 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.8436
INFO:tensorflow:loss = 1.242303, step = 170760 (7.788 sec)
INFO:tensorflow:lr = 7.189961e-05 (7.787 sec)
INFO:tensorflow:global_step/sec: 12.3776
INFO:tensorflow:loss = 1.2428727, step = 170860 (8.078 sec)
INFO:tensorflow:lr = 7.182739e-05 (8.080 sec)
INFO:tensorflow:global_step/sec: 12.614
INFO:tensorflow:loss = 1.245311, step = 170960 (7.930 sec)
INFO:tensorflow:lr = 7.1755225e-05 (7.928 sec)
INFO:tensorflow:global_step/sec: 12.8587
INFO:tensorflow:loss = 1.2429055, step = 171060 (7.771 sec)
INFO:tensorflow:lr = 7.1683135e-05 (7.774 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.60485
INFO:tensorflow:loss = 1.2450764, step = 171160 (11.623 sec)
INFO:tensorflow:lr = 7.161113e-05 (11.622 sec)
INFO:tensorflow:global_step/sec: 12.5893
INFO:tensorflow:loss = 1.2422101, step = 171260 (7.941 sec)
INFO:tensorflow:lr = 7.15392e-05 (7.941 sec)
INFO:tensorflow:global_step/sec: 12.1946
INFO:tensorflow:loss = 1.2442441, step = 171360 (8.204 sec)
INFO:tensorflow:lr = 7.1467344e-05 (8.203 sec)
INFO:tensorflow:global_step/sec: 12.5814
INFO:tensorflow:loss = 1.2420107, step = 171460 (7.948 sec)
INFO:tensorflow:lr = 7.139555e-05 (7.950 sec)
INFO:tensorflow:global_step/sec: 12.8204
INFO:tensorflow:loss = 1.2425112, step = 171560 (7.802 sec)
INFO:tensorflow:lr = 7.1323826e-05 (7.801 sec)
INFO:tensorflow:global_step/sec: 12.731
INFO:tensorflow:loss = 1.2440164, step = 171660 (7.851 sec)
INFO:tensorflow:lr = 7.125219e-05 (7.854 sec)
INFO:tensorflow:global_step/sec: 13.0197
INFO:tensorflow:loss = 1.2427493, step = 171760 (7.682 sec)
INFO:tensorflow:lr = 7.118061e-05 (7.678 sec)
INFO:tensorflow:global_step/sec: 12.7282
INFO:tensorflow:loss = 1.2409182, step = 171860 (7.854 sec)
INFO:tensorflow:lr = 7.1109105e-05 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.8746
INFO:tensorflow:loss = 1.2442806, step = 171960 (7.767 sec)
INFO:tensorflow:lr = 7.103767e-05 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.542
INFO:tensorflow:loss = 1.2414162, step = 172060 (7.973 sec)
INFO:tensorflow:lr = 7.0966315e-05 (7.971 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.09987
INFO:tensorflow:loss = 1.2424979, step = 172160 (10.990 sec)
INFO:tensorflow:lr = 7.089503e-05 (10.990 sec)
INFO:tensorflow:global_step/sec: 12.881
INFO:tensorflow:loss = 1.255378, step = 172260 (7.762 sec)
INFO:tensorflow:lr = 7.082381e-05 (7.762 sec)
INFO:tensorflow:global_step/sec: 12.6186
INFO:tensorflow:loss = 1.2428926, step = 172360 (7.925 sec)
INFO:tensorflow:lr = 7.075266e-05 (7.925 sec)
INFO:tensorflow:global_step/sec: 12.5197
INFO:tensorflow:loss = 1.2457323, step = 172460 (7.988 sec)
INFO:tensorflow:lr = 7.068159e-05 (7.988 sec)
INFO:tensorflow:global_step/sec: 13.1134
INFO:tensorflow:loss = 1.2408348, step = 172560 (7.625 sec)
INFO:tensorflow:lr = 7.0610586e-05 (7.625 sec)
INFO:tensorflow:global_step/sec: 12.8617
INFO:tensorflow:loss = 1.242487, step = 172660 (7.780 sec)
INFO:tensorflow:lr = 7.053967e-05 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.6416
INFO:tensorflow:loss = 1.2421248, step = 172760 (7.911 sec)
INFO:tensorflow:lr = 7.04688e-05 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.5986
INFO:tensorflow:loss = 1.240845, step = 172860 (7.934 sec)
INFO:tensorflow:lr = 7.0398026e-05 (7.934 sec)
INFO:tensorflow:global_step/sec: 12.9582
INFO:tensorflow:loss = 1.2410495, step = 172960 (7.721 sec)
INFO:tensorflow:lr = 7.0327296e-05 (7.721 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0786
INFO:tensorflow:loss = 1.2426779, step = 173060 (8.279 sec)
INFO:tensorflow:lr = 7.025665e-05 (8.280 sec)
INFO:tensorflow:global_step/sec: 10.6016
INFO:tensorflow:loss = 1.2406965, step = 173160 (9.433 sec)
INFO:tensorflow:lr = 7.0186084e-05 (9.432 sec)
INFO:tensorflow:global_step/sec: 12.9924
INFO:tensorflow:loss = 1.2419554, step = 173260 (7.695 sec)
INFO:tensorflow:lr = 7.0115566e-05 (7.697 sec)
INFO:tensorflow:global_step/sec: 12.6805
INFO:tensorflow:loss = 1.2415868, step = 173360 (7.886 sec)
INFO:tensorflow:lr = 7.004514e-05 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.8956
INFO:tensorflow:loss = 1.2414397, step = 173460 (7.751 sec)
INFO:tensorflow:lr = 6.9974776e-05 (7.750 sec)
INFO:tensorflow:global_step/sec: 12.8402
INFO:tensorflow:loss = 1.2436533, step = 173560 (7.790 sec)
INFO:tensorflow:lr = 6.9904476e-05 (7.789 sec)
INFO:tensorflow:global_step/sec: 12.6078
INFO:tensorflow:loss = 1.2412962, step = 173660 (7.932 sec)
INFO:tensorflow:lr = 6.983426e-05 (7.932 sec)
INFO:tensorflow:global_step/sec: 12.9803
INFO:tensorflow:loss = 1.2563962, step = 173760 (7.706 sec)
INFO:tensorflow:lr = 6.976411e-05 (7.708 sec)
INFO:tensorflow:global_step/sec: 12.5698
INFO:tensorflow:loss = 1.2463813, step = 173860 (7.951 sec)
INFO:tensorflow:lr = 6.9694026e-05 (7.949 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.4643
INFO:tensorflow:loss = 1.2427906, step = 173960 (8.028 sec)
INFO:tensorflow:lr = 6.9624024e-05 (8.030 sec)
INFO:tensorflow:global_step/sec: 11.041
INFO:tensorflow:loss = 1.2439783, step = 174060 (9.053 sec)
INFO:tensorflow:lr = 6.955408e-05 (9.055 sec)
INFO:tensorflow:global_step/sec: 12.7311
INFO:tensorflow:loss = 1.2426528, step = 174160 (7.855 sec)
INFO:tensorflow:lr = 6.9484224e-05 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.6687
INFO:tensorflow:loss = 1.2417759, step = 174260 (7.896 sec)
INFO:tensorflow:lr = 6.941441e-05 (7.895 sec)
INFO:tensorflow:global_step/sec: 12.5623
INFO:tensorflow:loss = 1.2435216, step = 174360 (7.957 sec)
INFO:tensorflow:lr = 6.9344685e-05 (7.958 sec)
INFO:tensorflow:global_step/sec: 12.637
INFO:tensorflow:loss = 1.2440283, step = 174460 (7.913 sec)
INFO:tensorflow:lr = 6.927503e-05 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.9613
INFO:tensorflow:loss = 1.2432188, step = 174560 (7.722 sec)
INFO:tensorflow:lr = 6.920543e-05 (7.721 sec)
INFO:tensorflow:global_step/sec: 12.822
INFO:tensorflow:loss = 1.2439592, step = 174660 (7.798 sec)
INFO:tensorflow:lr = 6.9135924e-05 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.7043
INFO:tensorflow:loss = 1.2439635, step = 174760 (7.866 sec)
INFO:tensorflow:lr = 6.9066475e-05 (7.868 sec)
INFO:tensorflow:global_step/sec: 12.64
INFO:tensorflow:loss = 1.2470303, step = 174860 (7.913 sec)
INFO:tensorflow:lr = 6.899709e-05 (7.911 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.29
INFO:tensorflow:loss = 1.242181, step = 174960 (8.140 sec)
INFO:tensorflow:lr = 6.892779e-05 (8.147 sec)
INFO:tensorflow:global_step/sec: 11.6222
INFO:tensorflow:loss = 1.2408583, step = 175060 (8.603 sec)
INFO:tensorflow:lr = 6.8858535e-05 (8.596 sec)
INFO:tensorflow:global_step/sec: 12.5978
INFO:tensorflow:loss = 1.2463039, step = 175160 (7.941 sec)
INFO:tensorflow:lr = 6.878937e-05 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.5607
INFO:tensorflow:loss = 1.2419947, step = 175260 (7.962 sec)
INFO:tensorflow:lr = 6.872027e-05 (7.962 sec)
INFO:tensorflow:global_step/sec: 12.602
INFO:tensorflow:loss = 1.2409464, step = 175360 (7.929 sec)
INFO:tensorflow:lr = 6.8651236e-05 (7.929 sec)
INFO:tensorflow:global_step/sec: 12.6779
INFO:tensorflow:loss = 1.2466931, step = 175460 (7.888 sec)
INFO:tensorflow:lr = 6.858228e-05 (7.888 sec)
INFO:tensorflow:global_step/sec: 12.8061
INFO:tensorflow:loss = 1.2410626, step = 175560 (7.814 sec)
INFO:tensorflow:lr = 6.8513385e-05 (7.814 sec)
INFO:tensorflow:global_step/sec: 12.7795
INFO:tensorflow:loss = 1.24094, step = 175660 (7.821 sec)
INFO:tensorflow:lr = 6.844457e-05 (7.822 sec)
INFO:tensorflow:global_step/sec: 12.6866
INFO:tensorflow:loss = 1.2434784, step = 175760 (7.881 sec)
INFO:tensorflow:lr = 6.8375804e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.7588
INFO:tensorflow:loss = 1.2445353, step = 175860 (7.841 sec)
INFO:tensorflow:lr = 6.830711e-05 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.4546
INFO:tensorflow:loss = 1.2431968, step = 175960 (8.026 sec)
INFO:tensorflow:lr = 6.823851e-05 (8.025 sec)
INFO:tensorflow:Saving checkpoints for 176040 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2408674.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-176040
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-176040
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.728
INFO:tensorflow:Best (Exact Match) Accuracy: 0.731
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-176040
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 176040 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2436473, step = 176040
INFO:tensorflow:lr = 6.818367e-05
INFO:tensorflow:global_step/sec: 10.061
INFO:tensorflow:loss = 1.2422326, step = 176140 (9.946 sec)
INFO:tensorflow:lr = 6.811516e-05 (9.948 sec)
INFO:tensorflow:global_step/sec: 12.8098
INFO:tensorflow:loss = 1.2441524, step = 176240 (7.801 sec)
INFO:tensorflow:lr = 6.804675e-05 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.5074
INFO:tensorflow:loss = 1.2437139, step = 176340 (8.002 sec)
INFO:tensorflow:lr = 6.797839e-05 (8.002 sec)
INFO:tensorflow:global_step/sec: 12.7508
INFO:tensorflow:loss = 1.2430073, step = 176440 (7.841 sec)
INFO:tensorflow:lr = 6.791011e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.9222
INFO:tensorflow:loss = 1.2443118, step = 176540 (7.736 sec)
INFO:tensorflow:lr = 6.784189e-05 (7.738 sec)
INFO:tensorflow:global_step/sec: 12.4978
INFO:tensorflow:loss = 1.2411668, step = 176640 (8.004 sec)
INFO:tensorflow:lr = 6.777373e-05 (8.002 sec)
INFO:tensorflow:global_step/sec: 12.7154
INFO:tensorflow:loss = 1.2438464, step = 176740 (7.867 sec)
INFO:tensorflow:lr = 6.770566e-05 (7.867 sec)
INFO:tensorflow:global_step/sec: 12.8534
INFO:tensorflow:loss = 1.2525758, step = 176840 (7.778 sec)
INFO:tensorflow:lr = 6.763765e-05 (7.778 sec)
INFO:tensorflow:global_step/sec: 12.7331
INFO:tensorflow:loss = 1.2458075, step = 176940 (7.850 sec)
INFO:tensorflow:lr = 6.756971e-05 (7.852 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35251
INFO:tensorflow:loss = 1.2425443, step = 177040 (11.971 sec)
INFO:tensorflow:lr = 6.750183e-05 (11.970 sec)
INFO:tensorflow:global_step/sec: 12.608
INFO:tensorflow:loss = 1.2432464, step = 177140 (7.932 sec)
INFO:tensorflow:lr = 6.743402e-05 (7.932 sec)
INFO:tensorflow:global_step/sec: 12.7623
INFO:tensorflow:loss = 1.2433742, step = 177240 (7.836 sec)
INFO:tensorflow:lr = 6.736629e-05 (7.836 sec)
INFO:tensorflow:global_step/sec: 12.5755
INFO:tensorflow:loss = 1.2442988, step = 177340 (7.950 sec)
INFO:tensorflow:lr = 6.7298606e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 13.0362
INFO:tensorflow:loss = 1.2423884, step = 177440 (7.671 sec)
INFO:tensorflow:lr = 6.723101e-05 (7.672 sec)
INFO:tensorflow:global_step/sec: 12.882
INFO:tensorflow:loss = 1.2411859, step = 177540 (7.767 sec)
INFO:tensorflow:lr = 6.716346e-05 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.7075
INFO:tensorflow:loss = 1.2438511, step = 177640 (7.866 sec)
INFO:tensorflow:lr = 6.7096e-05 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.7873
INFO:tensorflow:loss = 1.2472678, step = 177740 (7.824 sec)
INFO:tensorflow:lr = 6.70286e-05 (7.824 sec)
INFO:tensorflow:global_step/sec: 12.7072
INFO:tensorflow:loss = 1.2420048, step = 177840 (7.867 sec)
INFO:tensorflow:lr = 6.696127e-05 (7.866 sec)
INFO:tensorflow:global_step/sec: 12.8534
INFO:tensorflow:loss = 1.2439637, step = 177940 (7.783 sec)
INFO:tensorflow:lr = 6.6894005e-05 (7.783 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.30743
INFO:tensorflow:loss = 1.2429259, step = 178040 (12.035 sec)
INFO:tensorflow:lr = 6.6826804e-05 (12.035 sec)
INFO:tensorflow:global_step/sec: 12.8115
INFO:tensorflow:loss = 1.2417121, step = 178140 (7.803 sec)
INFO:tensorflow:lr = 6.675968e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.819
INFO:tensorflow:loss = 1.2494624, step = 178240 (7.801 sec)
INFO:tensorflow:lr = 6.669262e-05 (7.799 sec)
INFO:tensorflow:global_step/sec: 13.0614
INFO:tensorflow:loss = 1.2493565, step = 178340 (7.655 sec)
INFO:tensorflow:lr = 6.662562e-05 (7.654 sec)
INFO:tensorflow:global_step/sec: 12.6056
INFO:tensorflow:loss = 1.2468174, step = 178440 (7.934 sec)
INFO:tensorflow:lr = 6.65587e-05 (7.937 sec)
INFO:tensorflow:global_step/sec: 12.802
INFO:tensorflow:loss = 1.2427741, step = 178540 (7.810 sec)
INFO:tensorflow:lr = 6.649183e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.5317
INFO:tensorflow:loss = 1.2447419, step = 178640 (7.982 sec)
INFO:tensorflow:lr = 6.642503e-05 (7.981 sec)
INFO:tensorflow:global_step/sec: 12.833
INFO:tensorflow:loss = 1.242131, step = 178740 (7.790 sec)
INFO:tensorflow:lr = 6.635832e-05 (7.790 sec)
INFO:tensorflow:global_step/sec: 12.7559
INFO:tensorflow:loss = 1.2427136, step = 178840 (7.839 sec)
INFO:tensorflow:lr = 6.629166e-05 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.829
INFO:tensorflow:loss = 1.2427148, step = 178940 (7.800 sec)
INFO:tensorflow:lr = 6.6225075e-05 (7.800 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.35557
INFO:tensorflow:loss = 1.2481025, step = 179040 (11.968 sec)
INFO:tensorflow:lr = 6.615854e-05 (11.968 sec)
INFO:tensorflow:global_step/sec: 13.0739
INFO:tensorflow:loss = 1.2435266, step = 179140 (7.647 sec)
INFO:tensorflow:lr = 6.6092085e-05 (7.646 sec)
INFO:tensorflow:global_step/sec: 12.682
INFO:tensorflow:loss = 1.2475928, step = 179240 (7.882 sec)
INFO:tensorflow:lr = 6.60257e-05 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.5173
INFO:tensorflow:loss = 1.241785, step = 179340 (7.994 sec)
INFO:tensorflow:lr = 6.5959364e-05 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.6721
INFO:tensorflow:loss = 1.241673, step = 179440 (7.892 sec)
INFO:tensorflow:lr = 6.589311e-05 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.9129
INFO:tensorflow:loss = 1.2435246, step = 179540 (7.745 sec)
INFO:tensorflow:lr = 6.582692e-05 (7.745 sec)
INFO:tensorflow:global_step/sec: 12.656
INFO:tensorflow:loss = 1.2441323, step = 179640 (7.900 sec)
INFO:tensorflow:lr = 6.576078e-05 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.9244
INFO:tensorflow:loss = 1.2419387, step = 179740 (7.732 sec)
INFO:tensorflow:lr = 6.569474e-05 (7.735 sec)
INFO:tensorflow:global_step/sec: 12.892
INFO:tensorflow:loss = 1.2468823, step = 179840 (7.758 sec)
INFO:tensorflow:lr = 6.5628745e-05 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.6811
INFO:tensorflow:loss = 1.2426761, step = 179940 (7.884 sec)
INFO:tensorflow:lr = 6.556282e-05 (7.885 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.52812
INFO:tensorflow:loss = 1.2428222, step = 180040 (11.726 sec)
INFO:tensorflow:lr = 6.5496955e-05 (11.725 sec)
INFO:tensorflow:global_step/sec: 12.6168
INFO:tensorflow:loss = 1.2429457, step = 180140 (7.926 sec)
INFO:tensorflow:lr = 6.543116e-05 (7.928 sec)
INFO:tensorflow:global_step/sec: 12.7491
INFO:tensorflow:loss = 1.2432375, step = 180240 (7.847 sec)
INFO:tensorflow:lr = 6.5365435e-05 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.6939
INFO:tensorflow:loss = 1.242373, step = 180340 (7.881 sec)
INFO:tensorflow:lr = 6.529978e-05 (7.880 sec)
INFO:tensorflow:global_step/sec: 12.804
INFO:tensorflow:loss = 1.2414826, step = 180440 (7.805 sec)
INFO:tensorflow:lr = 6.523419e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.7029
INFO:tensorflow:loss = 1.244215, step = 180540 (7.875 sec)
INFO:tensorflow:lr = 6.516865e-05 (7.874 sec)
INFO:tensorflow:global_step/sec: 12.8393
INFO:tensorflow:loss = 1.2461091, step = 180640 (7.786 sec)
INFO:tensorflow:lr = 6.510318e-05 (7.788 sec)
INFO:tensorflow:global_step/sec: 12.7857
INFO:tensorflow:loss = 1.2421577, step = 180740 (7.822 sec)
INFO:tensorflow:lr = 6.503779e-05 (7.822 sec)
INFO:tensorflow:global_step/sec: 13.0485
INFO:tensorflow:loss = 1.2420781, step = 180840 (7.668 sec)
INFO:tensorflow:lr = 6.497245e-05 (7.666 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.7315
INFO:tensorflow:loss = 1.2411906, step = 180940 (11.447 sec)
INFO:tensorflow:lr = 6.490719e-05 (11.447 sec)
INFO:tensorflow:global_step/sec: 12.7866
INFO:tensorflow:loss = 1.2427506, step = 181040 (7.825 sec)
INFO:tensorflow:lr = 6.484198e-05 (7.825 sec)
INFO:tensorflow:global_step/sec: 12.4139
INFO:tensorflow:loss = 1.2419596, step = 181140 (8.051 sec)
INFO:tensorflow:lr = 6.477685e-05 (8.051 sec)
INFO:tensorflow:global_step/sec: 12.7857
INFO:tensorflow:loss = 1.2428209, step = 181240 (7.821 sec)
INFO:tensorflow:lr = 6.4711785e-05 (7.822 sec)
INFO:tensorflow:global_step/sec: 12.76
INFO:tensorflow:loss = 1.242671, step = 181340 (7.837 sec)
INFO:tensorflow:lr = 6.464678e-05 (7.835 sec)
INFO:tensorflow:global_step/sec: 13.0807
INFO:tensorflow:loss = 1.2421178, step = 181440 (7.651 sec)
INFO:tensorflow:lr = 6.458184e-05 (7.651 sec)
INFO:tensorflow:global_step/sec: 12.8754
INFO:tensorflow:loss = 1.2421011, step = 181540 (7.763 sec)
INFO:tensorflow:lr = 6.4516964e-05 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.3776
INFO:tensorflow:loss = 1.2435634, step = 181640 (8.076 sec)
INFO:tensorflow:lr = 6.445216e-05 (8.076 sec)
INFO:tensorflow:global_step/sec: 12.6016
INFO:tensorflow:loss = 1.2422757, step = 181740 (7.936 sec)
INFO:tensorflow:lr = 6.4387415e-05 (7.940 sec)
INFO:tensorflow:global_step/sec: 12.6405
INFO:tensorflow:loss = 1.2412153, step = 181840 (7.915 sec)
INFO:tensorflow:lr = 6.432273e-05 (7.911 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.44978
INFO:tensorflow:loss = 1.244641, step = 181940 (10.582 sec)
INFO:tensorflow:lr = 6.425812e-05 (10.582 sec)
INFO:tensorflow:global_step/sec: 13.0937
INFO:tensorflow:loss = 1.2411733, step = 182040 (7.638 sec)
INFO:tensorflow:lr = 6.419357e-05 (7.638 sec)
INFO:tensorflow:global_step/sec: 12.9868
INFO:tensorflow:loss = 1.2436959, step = 182140 (7.700 sec)
INFO:tensorflow:lr = 6.412908e-05 (7.700 sec)
INFO:tensorflow:global_step/sec: 12.7698
INFO:tensorflow:loss = 1.2463115, step = 182240 (7.826 sec)
INFO:tensorflow:lr = 6.406467e-05 (7.830 sec)
INFO:tensorflow:global_step/sec: 12.803
INFO:tensorflow:loss = 1.2440659, step = 182340 (7.816 sec)
INFO:tensorflow:lr = 6.4000305e-05 (7.812 sec)
INFO:tensorflow:global_step/sec: 12.522
INFO:tensorflow:loss = 1.2420621, step = 182440 (7.985 sec)
INFO:tensorflow:lr = 6.393602e-05 (7.985 sec)
INFO:tensorflow:global_step/sec: 12.4941
INFO:tensorflow:loss = 1.2414142, step = 182540 (8.005 sec)
INFO:tensorflow:lr = 6.387179e-05 (8.005 sec)
INFO:tensorflow:global_step/sec: 12.6789
INFO:tensorflow:loss = 1.2461977, step = 182640 (7.885 sec)
INFO:tensorflow:lr = 6.380763e-05 (7.886 sec)
INFO:tensorflow:global_step/sec: 13.0701
INFO:tensorflow:loss = 1.2416025, step = 182740 (7.654 sec)
INFO:tensorflow:lr = 6.3743544e-05 (7.652 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.29
INFO:tensorflow:loss = 1.2431751, step = 182840 (8.133 sec)
INFO:tensorflow:lr = 6.36795e-05 (8.136 sec)
INFO:tensorflow:global_step/sec: 10.6503
INFO:tensorflow:loss = 1.2422962, step = 182940 (9.393 sec)
INFO:tensorflow:lr = 6.361554e-05 (9.390 sec)
INFO:tensorflow:global_step/sec: 13.0235
INFO:tensorflow:loss = 1.2496976, step = 183040 (7.673 sec)
INFO:tensorflow:lr = 6.355163e-05 (7.677 sec)
INFO:tensorflow:global_step/sec: 12.6265
INFO:tensorflow:loss = 1.2432393, step = 183140 (7.924 sec)
INFO:tensorflow:lr = 6.348779e-05 (7.920 sec)
INFO:tensorflow:global_step/sec: 12.6644
INFO:tensorflow:loss = 1.243746, step = 183240 (7.891 sec)
INFO:tensorflow:lr = 6.342402e-05 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.7925
INFO:tensorflow:loss = 1.2410957, step = 183340 (7.817 sec)
INFO:tensorflow:lr = 6.3360305e-05 (7.818 sec)
INFO:tensorflow:global_step/sec: 13.0226
INFO:tensorflow:loss = 1.2438482, step = 183440 (7.684 sec)
INFO:tensorflow:lr = 6.329667e-05 (7.684 sec)
INFO:tensorflow:global_step/sec: 12.7638
INFO:tensorflow:loss = 1.245033, step = 183540 (7.835 sec)
INFO:tensorflow:lr = 6.3233085e-05 (7.835 sec)
INFO:tensorflow:global_step/sec: 12.7621
INFO:tensorflow:loss = 1.2443069, step = 183640 (7.837 sec)
INFO:tensorflow:lr = 6.316956e-05 (7.837 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5158
INFO:tensorflow:loss = 1.2428632, step = 183740 (7.991 sec)
INFO:tensorflow:lr = 6.31061e-05 (7.990 sec)
INFO:tensorflow:global_step/sec: 11.0577
INFO:tensorflow:loss = 1.2430586, step = 183840 (9.036 sec)
INFO:tensorflow:lr = 6.304271e-05 (9.036 sec)
INFO:tensorflow:global_step/sec: 12.7589
INFO:tensorflow:loss = 1.242105, step = 183940 (7.842 sec)
INFO:tensorflow:lr = 6.297939e-05 (7.842 sec)
INFO:tensorflow:global_step/sec: 12.875
INFO:tensorflow:loss = 1.2421196, step = 184040 (7.770 sec)
INFO:tensorflow:lr = 6.2916115e-05 (7.770 sec)
INFO:tensorflow:global_step/sec: 12.8843
INFO:tensorflow:loss = 1.2427078, step = 184140 (7.759 sec)
INFO:tensorflow:lr = 6.285291e-05 (7.758 sec)
INFO:tensorflow:global_step/sec: 12.8214
INFO:tensorflow:loss = 1.2439513, step = 184240 (7.795 sec)
INFO:tensorflow:lr = 6.278978e-05 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.6415
INFO:tensorflow:loss = 1.2408562, step = 184340 (7.911 sec)
INFO:tensorflow:lr = 6.272671e-05 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.6495
INFO:tensorflow:loss = 1.2422056, step = 184440 (7.915 sec)
INFO:tensorflow:lr = 6.2663705e-05 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.7647
INFO:tensorflow:loss = 1.2462195, step = 184540 (7.828 sec)
INFO:tensorflow:lr = 6.260074e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.8077
INFO:tensorflow:loss = 1.2462376, step = 184640 (7.804 sec)
INFO:tensorflow:lr = 6.253786e-05 (7.804 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1954
INFO:tensorflow:loss = 1.2416941, step = 184740 (8.206 sec)
INFO:tensorflow:lr = 6.247504e-05 (8.209 sec)
INFO:tensorflow:global_step/sec: 11.4304
INFO:tensorflow:loss = 1.243738, step = 184840 (8.742 sec)
INFO:tensorflow:lr = 6.2412284e-05 (8.739 sec)
INFO:tensorflow:global_step/sec: 12.7942
INFO:tensorflow:loss = 1.242184, step = 184940 (7.818 sec)
INFO:tensorflow:lr = 6.23496e-05 (7.818 sec)
INFO:tensorflow:global_step/sec: 12.5375
INFO:tensorflow:loss = 1.2413771, step = 185040 (7.977 sec)
INFO:tensorflow:lr = 6.2286956e-05 (7.977 sec)
INFO:tensorflow:global_step/sec: 12.7844
INFO:tensorflow:loss = 1.2429293, step = 185140 (7.819 sec)
INFO:tensorflow:lr = 6.222439e-05 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.7958
INFO:tensorflow:loss = 1.245569, step = 185240 (7.820 sec)
INFO:tensorflow:lr = 6.216188e-05 (7.820 sec)
INFO:tensorflow:global_step/sec: 12.5349
INFO:tensorflow:loss = 1.240598, step = 185340 (7.979 sec)
INFO:tensorflow:lr = 6.209943e-05 (7.979 sec)
INFO:tensorflow:global_step/sec: 12.7825
INFO:tensorflow:loss = 1.2407473, step = 185440 (7.820 sec)
INFO:tensorflow:lr = 6.203707e-05 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.7777
INFO:tensorflow:loss = 1.24277, step = 185540 (7.826 sec)
INFO:tensorflow:lr = 6.1974744e-05 (7.825 sec)
INFO:tensorflow:global_step/sec: 12.9954
INFO:tensorflow:loss = 1.2449442, step = 185640 (7.693 sec)
INFO:tensorflow:lr = 6.1912484e-05 (7.693 sec)
INFO:tensorflow:global_step/sec: 12.6443
INFO:tensorflow:loss = 1.2449242, step = 185740 (7.907 sec)
INFO:tensorflow:lr = 6.1850296e-05 (7.907 sec)
INFO:tensorflow:Saving checkpoints for 185820 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.242429.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-185820
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-185820
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.732
INFO:tensorflow:Best (Exact Match) Accuracy: 0.732
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-185820
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 185820 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2430956, step = 185820
INFO:tensorflow:lr = 6.180058e-05
INFO:tensorflow:global_step/sec: 10.2397
INFO:tensorflow:loss = 1.2422625, step = 185920 (9.768 sec)
INFO:tensorflow:lr = 6.17385e-05 (9.768 sec)
INFO:tensorflow:global_step/sec: 12.5678
INFO:tensorflow:loss = 1.2413614, step = 186020 (7.957 sec)
INFO:tensorflow:lr = 6.167648e-05 (7.956 sec)
INFO:tensorflow:global_step/sec: 12.6587
INFO:tensorflow:loss = 1.242497, step = 186120 (7.899 sec)
INFO:tensorflow:lr = 6.1614526e-05 (7.899 sec)
INFO:tensorflow:global_step/sec: 13.0192
INFO:tensorflow:loss = 1.2470552, step = 186220 (7.683 sec)
INFO:tensorflow:lr = 6.155264e-05 (7.683 sec)
INFO:tensorflow:global_step/sec: 12.8884
INFO:tensorflow:loss = 1.2431347, step = 186320 (7.758 sec)
INFO:tensorflow:lr = 6.1490806e-05 (7.758 sec)
INFO:tensorflow:global_step/sec: 12.7696
INFO:tensorflow:loss = 1.2459142, step = 186420 (7.830 sec)
INFO:tensorflow:lr = 6.142903e-05 (7.832 sec)
INFO:tensorflow:global_step/sec: 12.9001
INFO:tensorflow:loss = 1.2413319, step = 186520 (7.754 sec)
INFO:tensorflow:lr = 6.136733e-05 (7.755 sec)
INFO:tensorflow:global_step/sec: 12.7284
INFO:tensorflow:loss = 1.2430797, step = 186620 (7.859 sec)
INFO:tensorflow:lr = 6.130568e-05 (7.856 sec)
INFO:tensorflow:global_step/sec: 12.3593
INFO:tensorflow:loss = 1.2427655, step = 186720 (8.087 sec)
INFO:tensorflow:lr = 6.12441e-05 (8.087 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.38791
INFO:tensorflow:loss = 1.2434381, step = 186820 (11.926 sec)
INFO:tensorflow:lr = 6.118258e-05 (11.926 sec)
INFO:tensorflow:global_step/sec: 12.7746
INFO:tensorflow:loss = 1.2431988, step = 186920 (7.828 sec)
INFO:tensorflow:lr = 6.1121114e-05 (7.828 sec)
INFO:tensorflow:global_step/sec: 12.3576
INFO:tensorflow:loss = 1.240415, step = 187020 (8.090 sec)
INFO:tensorflow:lr = 6.105973e-05 (8.092 sec)
INFO:tensorflow:global_step/sec: 12.5951
INFO:tensorflow:loss = 1.2401947, step = 187120 (7.938 sec)
INFO:tensorflow:lr = 6.0998384e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.5726
INFO:tensorflow:loss = 1.2473856, step = 187220 (7.957 sec)
INFO:tensorflow:lr = 6.0937105e-05 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.7697
INFO:tensorflow:loss = 1.2429252, step = 187320 (7.828 sec)
INFO:tensorflow:lr = 6.0875893e-05 (7.825 sec)
INFO:tensorflow:global_step/sec: 13.0692
INFO:tensorflow:loss = 1.2432778, step = 187420 (7.652 sec)
INFO:tensorflow:lr = 6.0814742e-05 (7.652 sec)
INFO:tensorflow:global_step/sec: 12.8313
INFO:tensorflow:loss = 1.24176, step = 187520 (7.793 sec)
INFO:tensorflow:lr = 6.075366e-05 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.7361
INFO:tensorflow:loss = 1.2408872, step = 187620 (7.858 sec)
INFO:tensorflow:lr = 6.0692626e-05 (7.853 sec)
INFO:tensorflow:global_step/sec: 12.5969
INFO:tensorflow:loss = 1.2419, step = 187720 (7.933 sec)
INFO:tensorflow:lr = 6.0631653e-05 (7.934 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.32018
INFO:tensorflow:loss = 1.2422671, step = 187820 (12.022 sec)
INFO:tensorflow:lr = 6.0570757e-05 (12.021 sec)
INFO:tensorflow:global_step/sec: 13.0867
INFO:tensorflow:loss = 1.2460558, step = 187920 (7.638 sec)
INFO:tensorflow:lr = 6.05099e-05 (7.638 sec)
INFO:tensorflow:global_step/sec: 12.3994
INFO:tensorflow:loss = 1.2414271, step = 188020 (8.072 sec)
INFO:tensorflow:lr = 6.044912e-05 (8.072 sec)
INFO:tensorflow:global_step/sec: 12.533
INFO:tensorflow:loss = 1.2409451, step = 188120 (7.975 sec)
INFO:tensorflow:lr = 6.0388404e-05 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.8062
INFO:tensorflow:loss = 1.2424439, step = 188220 (7.806 sec)
INFO:tensorflow:lr = 6.032773e-05 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.7571
INFO:tensorflow:loss = 1.2418518, step = 188320 (7.842 sec)
INFO:tensorflow:lr = 6.0267135e-05 (7.841 sec)
INFO:tensorflow:global_step/sec: 12.7492
INFO:tensorflow:loss = 1.2417756, step = 188420 (7.845 sec)
INFO:tensorflow:lr = 6.0206596e-05 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.6351
INFO:tensorflow:loss = 1.2414497, step = 188520 (7.912 sec)
INFO:tensorflow:lr = 6.014612e-05 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.8196
INFO:tensorflow:loss = 1.242274, step = 188620 (7.805 sec)
INFO:tensorflow:lr = 6.0085706e-05 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.6623
INFO:tensorflow:loss = 1.2413298, step = 188720 (7.895 sec)
INFO:tensorflow:lr = 6.0025337e-05 (7.895 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.37098
INFO:tensorflow:loss = 1.241566, step = 188820 (11.942 sec)
INFO:tensorflow:lr = 5.996505e-05 (11.941 sec)
INFO:tensorflow:global_step/sec: 12.5102
INFO:tensorflow:loss = 1.2479603, step = 188920 (7.998 sec)
INFO:tensorflow:lr = 5.9904807e-05 (8.003 sec)
INFO:tensorflow:global_step/sec: 12.7268
INFO:tensorflow:loss = 1.2499129, step = 189020 (7.855 sec)
INFO:tensorflow:lr = 5.9844642e-05 (7.851 sec)
INFO:tensorflow:global_step/sec: 12.705
INFO:tensorflow:loss = 1.2405927, step = 189120 (7.875 sec)
INFO:tensorflow:lr = 5.9784517e-05 (7.875 sec)
INFO:tensorflow:global_step/sec: 12.8384
INFO:tensorflow:loss = 1.2449517, step = 189220 (7.784 sec)
INFO:tensorflow:lr = 5.9724454e-05 (7.784 sec)
INFO:tensorflow:global_step/sec: 12.8968
INFO:tensorflow:loss = 1.2450413, step = 189320 (7.756 sec)
INFO:tensorflow:lr = 5.9664464e-05 (7.758 sec)
INFO:tensorflow:global_step/sec: 12.9367
INFO:tensorflow:loss = 1.2425894, step = 189420 (7.727 sec)
INFO:tensorflow:lr = 5.960453e-05 (7.726 sec)
INFO:tensorflow:global_step/sec: 12.5036
INFO:tensorflow:loss = 1.2416962, step = 189520 (8.003 sec)
INFO:tensorflow:lr = 5.954466e-05 (8.003 sec)
INFO:tensorflow:global_step/sec: 12.7556
INFO:tensorflow:loss = 1.2433455, step = 189620 (7.835 sec)
INFO:tensorflow:lr = 5.948484e-05 (7.834 sec)
INFO:tensorflow:global_step/sec: 13.0041
INFO:tensorflow:loss = 1.2446123, step = 189720 (7.690 sec)
INFO:tensorflow:lr = 5.9425085e-05 (7.690 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.51546
INFO:tensorflow:loss = 1.2419295, step = 189820 (11.748 sec)
INFO:tensorflow:lr = 5.9365397e-05 (11.747 sec)
INFO:tensorflow:global_step/sec: 12.8369
INFO:tensorflow:loss = 1.2428107, step = 189920 (7.784 sec)
INFO:tensorflow:lr = 5.9305763e-05 (7.784 sec)
INFO:tensorflow:global_step/sec: 12.8227
INFO:tensorflow:loss = 1.2412173, step = 190020 (7.799 sec)
INFO:tensorflow:lr = 5.9246187e-05 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.8477
INFO:tensorflow:loss = 1.2426255, step = 190120 (7.788 sec)
INFO:tensorflow:lr = 5.918667e-05 (7.787 sec)
INFO:tensorflow:global_step/sec: 13.0337
INFO:tensorflow:loss = 1.2452132, step = 190220 (7.670 sec)
INFO:tensorflow:lr = 5.9127215e-05 (7.672 sec)
INFO:tensorflow:global_step/sec: 12.5826
INFO:tensorflow:loss = 1.2415522, step = 190320 (7.944 sec)
INFO:tensorflow:lr = 5.9067825e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.4786
INFO:tensorflow:loss = 1.2416269, step = 190420 (8.014 sec)
INFO:tensorflow:lr = 5.900849e-05 (8.015 sec)
INFO:tensorflow:global_step/sec: 12.8258
INFO:tensorflow:loss = 1.2427078, step = 190520 (7.804 sec)
INFO:tensorflow:lr = 5.894922e-05 (7.803 sec)
INFO:tensorflow:global_step/sec: 12.7805
INFO:tensorflow:loss = 1.2445235, step = 190620 (7.821 sec)
INFO:tensorflow:lr = 5.8889997e-05 (7.820 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.49193
INFO:tensorflow:loss = 1.247068, step = 190720 (11.774 sec)
INFO:tensorflow:lr = 5.883084e-05 (11.775 sec)
INFO:tensorflow:global_step/sec: 12.6129
INFO:tensorflow:loss = 1.2422463, step = 190820 (7.928 sec)
INFO:tensorflow:lr = 5.877174e-05 (7.929 sec)
INFO:tensorflow:global_step/sec: 12.6408
INFO:tensorflow:loss = 1.2405804, step = 190920 (7.911 sec)
INFO:tensorflow:lr = 5.8712703e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.635
INFO:tensorflow:loss = 1.2446344, step = 191020 (7.914 sec)
INFO:tensorflow:lr = 5.8653728e-05 (7.914 sec)
INFO:tensorflow:global_step/sec: 12.713
INFO:tensorflow:loss = 1.2437266, step = 191120 (7.866 sec)
INFO:tensorflow:lr = 5.8594804e-05 (7.869 sec)
INFO:tensorflow:global_step/sec: 12.8576
INFO:tensorflow:loss = 1.2444649, step = 191220 (7.782 sec)
INFO:tensorflow:lr = 5.8535945e-05 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.7873
INFO:tensorflow:loss = 1.2414025, step = 191320 (7.821 sec)
INFO:tensorflow:lr = 5.847715e-05 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.5444
INFO:tensorflow:loss = 1.2417895, step = 191420 (7.970 sec)
INFO:tensorflow:lr = 5.8418398e-05 (7.970 sec)
INFO:tensorflow:global_step/sec: 12.6289
INFO:tensorflow:loss = 1.2412646, step = 191520 (7.916 sec)
INFO:tensorflow:lr = 5.835972e-05 (7.915 sec)
INFO:tensorflow:global_step/sec: 12.7265
INFO:tensorflow:loss = 1.2413337, step = 191620 (7.859 sec)
INFO:tensorflow:lr = 5.8301095e-05 (7.861 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.09703
INFO:tensorflow:loss = 1.2453784, step = 191720 (10.996 sec)
INFO:tensorflow:lr = 5.8242527e-05 (10.994 sec)
INFO:tensorflow:global_step/sec: 12.7438
INFO:tensorflow:loss = 1.2416813, step = 191820 (7.849 sec)
INFO:tensorflow:lr = 5.8184025e-05 (7.849 sec)
INFO:tensorflow:global_step/sec: 13.0111
INFO:tensorflow:loss = 1.2428048, step = 191920 (7.680 sec)
INFO:tensorflow:lr = 5.8125574e-05 (7.682 sec)
INFO:tensorflow:global_step/sec: 12.8564
INFO:tensorflow:loss = 1.2413689, step = 192020 (7.777 sec)
INFO:tensorflow:lr = 5.8067188e-05 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.5216
INFO:tensorflow:loss = 1.2429854, step = 192120 (7.986 sec)
INFO:tensorflow:lr = 5.8008867e-05 (7.982 sec)
INFO:tensorflow:global_step/sec: 12.8034
INFO:tensorflow:loss = 1.244082, step = 192220 (7.814 sec)
INFO:tensorflow:lr = 5.7950583e-05 (7.813 sec)
INFO:tensorflow:global_step/sec: 12.5927
INFO:tensorflow:loss = 1.2440885, step = 192320 (7.944 sec)
INFO:tensorflow:lr = 5.7892375e-05 (7.947 sec)
INFO:tensorflow:global_step/sec: 12.5696
INFO:tensorflow:loss = 1.2455595, step = 192420 (7.949 sec)
INFO:tensorflow:lr = 5.783422e-05 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.8255
INFO:tensorflow:loss = 1.2410458, step = 192520 (7.797 sec)
INFO:tensorflow:lr = 5.7776128e-05 (7.796 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.2228
INFO:tensorflow:loss = 1.2421664, step = 192620 (8.181 sec)
INFO:tensorflow:lr = 5.771809e-05 (8.180 sec)
INFO:tensorflow:global_step/sec: 10.7852
INFO:tensorflow:loss = 1.2432908, step = 192720 (9.272 sec)
INFO:tensorflow:lr = 5.76601e-05 (9.272 sec)
INFO:tensorflow:global_step/sec: 12.9277
INFO:tensorflow:loss = 1.2420142, step = 192820 (7.736 sec)
INFO:tensorflow:lr = 5.7602185e-05 (7.736 sec)
INFO:tensorflow:global_step/sec: 13.0745
INFO:tensorflow:loss = 1.2412543, step = 192920 (7.649 sec)
INFO:tensorflow:lr = 5.7544326e-05 (7.649 sec)
INFO:tensorflow:global_step/sec: 12.769
INFO:tensorflow:loss = 1.2427813, step = 193020 (7.836 sec)
INFO:tensorflow:lr = 5.7486523e-05 (7.835 sec)
INFO:tensorflow:global_step/sec: 12.6918
INFO:tensorflow:loss = 1.2403716, step = 193120 (7.874 sec)
INFO:tensorflow:lr = 5.7428777e-05 (7.874 sec)
INFO:tensorflow:global_step/sec: 12.6062
INFO:tensorflow:loss = 1.2418182, step = 193220 (7.933 sec)
INFO:tensorflow:lr = 5.737108e-05 (7.932 sec)
INFO:tensorflow:global_step/sec: 12.3039
INFO:tensorflow:loss = 1.2434244, step = 193320 (8.128 sec)
INFO:tensorflow:lr = 5.7313453e-05 (8.129 sec)
INFO:tensorflow:global_step/sec: 12.7618
INFO:tensorflow:loss = 1.2468263, step = 193420 (7.836 sec)
INFO:tensorflow:lr = 5.7255882e-05 (7.835 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.9098
INFO:tensorflow:loss = 1.2425442, step = 193520 (7.748 sec)
INFO:tensorflow:lr = 5.719837e-05 (7.749 sec)
INFO:tensorflow:global_step/sec: 11.04
INFO:tensorflow:loss = 1.2404422, step = 193620 (9.060 sec)
INFO:tensorflow:lr = 5.7140904e-05 (9.059 sec)
INFO:tensorflow:global_step/sec: 12.8864
INFO:tensorflow:loss = 1.2420374, step = 193720 (7.763 sec)
INFO:tensorflow:lr = 5.7083504e-05 (7.763 sec)
INFO:tensorflow:global_step/sec: 12.6563
INFO:tensorflow:loss = 1.24243, step = 193820 (7.902 sec)
INFO:tensorflow:lr = 5.7026165e-05 (7.901 sec)
INFO:tensorflow:global_step/sec: 12.5789
INFO:tensorflow:loss = 1.2422926, step = 193920 (7.943 sec)
INFO:tensorflow:lr = 5.696888e-05 (7.944 sec)
INFO:tensorflow:global_step/sec: 12.7081
INFO:tensorflow:loss = 1.2414744, step = 194020 (7.869 sec)
INFO:tensorflow:lr = 5.6911656e-05 (7.868 sec)
INFO:tensorflow:global_step/sec: 12.9398
INFO:tensorflow:loss = 1.242649, step = 194120 (7.728 sec)
INFO:tensorflow:lr = 5.6854486e-05 (7.727 sec)
INFO:tensorflow:global_step/sec: 13.0157
INFO:tensorflow:loss = 1.2424544, step = 194220 (7.691 sec)
INFO:tensorflow:lr = 5.6797366e-05 (7.692 sec)
INFO:tensorflow:global_step/sec: 12.5769
INFO:tensorflow:loss = 1.2423269, step = 194320 (7.943 sec)
INFO:tensorflow:lr = 5.674032e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.6673
INFO:tensorflow:loss = 1.242586, step = 194420 (7.902 sec)
INFO:tensorflow:lr = 5.668332e-05 (7.902 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.923
INFO:tensorflow:loss = 1.2406418, step = 194520 (8.380 sec)
INFO:tensorflow:lr = 5.6626384e-05 (8.380 sec)
INFO:tensorflow:global_step/sec: 11.3406
INFO:tensorflow:loss = 1.2411753, step = 194620 (8.823 sec)
INFO:tensorflow:lr = 5.656949e-05 (8.823 sec)
INFO:tensorflow:global_step/sec: 12.7301
INFO:tensorflow:loss = 1.2445536, step = 194720 (7.855 sec)
INFO:tensorflow:lr = 5.6512672e-05 (7.859 sec)
INFO:tensorflow:global_step/sec: 12.9083
INFO:tensorflow:loss = 1.241786, step = 194820 (7.748 sec)
INFO:tensorflow:lr = 5.64559e-05 (7.743 sec)
INFO:tensorflow:global_step/sec: 12.7429
INFO:tensorflow:loss = 1.2426987, step = 194920 (7.845 sec)
INFO:tensorflow:lr = 5.639918e-05 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.804
INFO:tensorflow:loss = 1.2429112, step = 195020 (7.815 sec)
INFO:tensorflow:lr = 5.6342542e-05 (7.812 sec)
INFO:tensorflow:global_step/sec: 12.4789
INFO:tensorflow:loss = 1.2444768, step = 195120 (8.011 sec)
INFO:tensorflow:lr = 5.628594e-05 (8.012 sec)
INFO:tensorflow:global_step/sec: 12.7206
INFO:tensorflow:loss = 1.2421489, step = 195220 (7.856 sec)
INFO:tensorflow:lr = 5.62294e-05 (7.857 sec)
INFO:tensorflow:global_step/sec: 12.4673
INFO:tensorflow:loss = 1.2470261, step = 195320 (8.025 sec)
INFO:tensorflow:lr = 5.6172918e-05 (8.024 sec)
INFO:tensorflow:global_step/sec: 12.5697
INFO:tensorflow:loss = 1.243064, step = 195420 (7.954 sec)
INFO:tensorflow:lr = 5.6116485e-05 (7.954 sec)
INFO:tensorflow:global_step/sec: 12.7259
INFO:tensorflow:loss = 1.2425088, step = 195520 (7.854 sec)
INFO:tensorflow:lr = 5.6060122e-05 (7.859 sec)
INFO:tensorflow:Saving checkpoints for 195600 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2410872.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-195600
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-195600
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.733
INFO:tensorflow:Best (Exact Match) Accuracy: 0.733
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-195600
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 195600 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2424295, step = 195600
INFO:tensorflow:lr = 5.6015062e-05
INFO:tensorflow:global_step/sec: 10.1273
INFO:tensorflow:loss = 1.242512, step = 195700 (9.884 sec)
INFO:tensorflow:lr = 5.5958793e-05 (9.884 sec)
INFO:tensorflow:global_step/sec: 12.6818
INFO:tensorflow:loss = 1.2421359, step = 195800 (7.884 sec)
INFO:tensorflow:lr = 5.5902587e-05 (7.885 sec)
INFO:tensorflow:global_step/sec: 12.732
INFO:tensorflow:loss = 1.2427982, step = 195900 (7.855 sec)
INFO:tensorflow:lr = 5.584642e-05 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.7171
INFO:tensorflow:loss = 1.2436755, step = 196000 (7.861 sec)
INFO:tensorflow:lr = 5.5790315e-05 (7.860 sec)
INFO:tensorflow:global_step/sec: 12.8571
INFO:tensorflow:loss = 1.242795, step = 196100 (7.779 sec)
INFO:tensorflow:lr = 5.5734283e-05 (7.778 sec)
INFO:tensorflow:global_step/sec: 12.7439
INFO:tensorflow:loss = 1.2420249, step = 196200 (7.846 sec)
INFO:tensorflow:lr = 5.5678294e-05 (7.846 sec)
INFO:tensorflow:global_step/sec: 12.7956
INFO:tensorflow:loss = 1.2426386, step = 196300 (7.813 sec)
INFO:tensorflow:lr = 5.5622368e-05 (7.812 sec)
INFO:tensorflow:global_step/sec: 12.7607
INFO:tensorflow:loss = 1.2421803, step = 196400 (7.835 sec)
INFO:tensorflow:lr = 5.556649e-05 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.9493
INFO:tensorflow:loss = 1.2418551, step = 196500 (7.729 sec)
INFO:tensorflow:lr = 5.5510667e-05 (7.725 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.32006
INFO:tensorflow:loss = 1.2419361, step = 196600 (12.016 sec)
INFO:tensorflow:lr = 5.5454908e-05 (12.017 sec)
INFO:tensorflow:global_step/sec: 12.5265
INFO:tensorflow:loss = 1.2419522, step = 196700 (7.985 sec)
INFO:tensorflow:lr = 5.5399207e-05 (7.985 sec)
INFO:tensorflow:global_step/sec: 12.6023
INFO:tensorflow:loss = 1.2418892, step = 196800 (7.930 sec)
INFO:tensorflow:lr = 5.534356e-05 (7.929 sec)
INFO:tensorflow:global_step/sec: 12.79
INFO:tensorflow:loss = 1.2402346, step = 196900 (7.818 sec)
INFO:tensorflow:lr = 5.5287957e-05 (7.818 sec)
INFO:tensorflow:global_step/sec: 12.8103
INFO:tensorflow:loss = 1.242253, step = 197000 (7.807 sec)
INFO:tensorflow:lr = 5.5232424e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 12.9615
INFO:tensorflow:loss = 1.2404039, step = 197100 (7.719 sec)
INFO:tensorflow:lr = 5.517694e-05 (7.718 sec)
INFO:tensorflow:global_step/sec: 12.904
INFO:tensorflow:loss = 1.2524287, step = 197200 (7.751 sec)
INFO:tensorflow:lr = 5.5121516e-05 (7.751 sec)
INFO:tensorflow:global_step/sec: 12.6763
INFO:tensorflow:loss = 1.2418357, step = 197300 (7.887 sec)
INFO:tensorflow:lr = 5.506615e-05 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.6131
INFO:tensorflow:loss = 1.2412477, step = 197400 (7.925 sec)
INFO:tensorflow:lr = 5.5010823e-05 (7.924 sec)
INFO:tensorflow:global_step/sec: 12.6833
INFO:tensorflow:loss = 1.2424623, step = 197500 (7.889 sec)
INFO:tensorflow:lr = 5.495556e-05 (7.890 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.2987
INFO:tensorflow:loss = 1.2423265, step = 197600 (12.045 sec)
INFO:tensorflow:lr = 5.4900363e-05 (12.046 sec)
INFO:tensorflow:global_step/sec: 13.031
INFO:tensorflow:loss = 1.2457525, step = 197700 (7.678 sec)
INFO:tensorflow:lr = 5.484521e-05 (7.679 sec)
INFO:tensorflow:global_step/sec: 12.9439
INFO:tensorflow:loss = 1.2480465, step = 197800 (7.721 sec)
INFO:tensorflow:lr = 5.4790125e-05 (7.720 sec)
INFO:tensorflow:global_step/sec: 12.7214
INFO:tensorflow:loss = 1.2456297, step = 197900 (7.862 sec)
INFO:tensorflow:lr = 5.4735083e-05 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.8302
INFO:tensorflow:loss = 1.2427973, step = 198000 (7.799 sec)
INFO:tensorflow:lr = 5.4680095e-05 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.8085
INFO:tensorflow:loss = 1.2444547, step = 198100 (7.801 sec)
INFO:tensorflow:lr = 5.4625176e-05 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.8353
INFO:tensorflow:loss = 1.2432563, step = 198200 (7.796 sec)
INFO:tensorflow:lr = 5.4570293e-05 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.6867
INFO:tensorflow:loss = 1.2415416, step = 198300 (7.877 sec)
INFO:tensorflow:lr = 5.451548e-05 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.7024
INFO:tensorflow:loss = 1.2426435, step = 198400 (7.873 sec)
INFO:tensorflow:lr = 5.446072e-05 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.6592
INFO:tensorflow:loss = 1.2404841, step = 198500 (7.905 sec)
INFO:tensorflow:lr = 5.4406017e-05 (7.905 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.28541
INFO:tensorflow:loss = 1.2406154, step = 198600 (12.064 sec)
INFO:tensorflow:lr = 5.4351363e-05 (12.064 sec)
INFO:tensorflow:global_step/sec: 13.0017
INFO:tensorflow:loss = 1.2456881, step = 198700 (7.697 sec)
INFO:tensorflow:lr = 5.429676e-05 (7.697 sec)
INFO:tensorflow:global_step/sec: 12.81
INFO:tensorflow:loss = 1.2410623, step = 198800 (7.805 sec)
INFO:tensorflow:lr = 5.424222e-05 (7.806 sec)
INFO:tensorflow:global_step/sec: 12.8692
INFO:tensorflow:loss = 1.2445118, step = 198900 (7.766 sec)
INFO:tensorflow:lr = 5.4187738e-05 (7.766 sec)
INFO:tensorflow:global_step/sec: 12.7127
INFO:tensorflow:loss = 1.244541, step = 199000 (7.871 sec)
INFO:tensorflow:lr = 5.41333e-05 (7.870 sec)
INFO:tensorflow:global_step/sec: 12.7484
INFO:tensorflow:loss = 1.2432263, step = 199100 (7.845 sec)
INFO:tensorflow:lr = 5.407892e-05 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.6662
INFO:tensorflow:loss = 1.2418202, step = 199200 (7.895 sec)
INFO:tensorflow:lr = 5.4024593e-05 (7.895 sec)
INFO:tensorflow:global_step/sec: 13.0052
INFO:tensorflow:loss = 1.2434285, step = 199300 (7.686 sec)
INFO:tensorflow:lr = 5.397033e-05 (7.687 sec)
INFO:tensorflow:global_step/sec: 12.6949
INFO:tensorflow:loss = 1.241352, step = 199400 (7.881 sec)
INFO:tensorflow:lr = 5.3916112e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.5404
INFO:tensorflow:loss = 1.2433487, step = 199500 (7.969 sec)
INFO:tensorflow:lr = 5.3861946e-05 (7.976 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.31808
INFO:tensorflow:loss = 1.2508881, step = 199600 (12.024 sec)
INFO:tensorflow:lr = 5.3807846e-05 (12.018 sec)
INFO:tensorflow:global_step/sec: 13.2693
INFO:tensorflow:loss = 1.2405204, step = 199700 (7.538 sec)
INFO:tensorflow:lr = 5.3753793e-05 (7.536 sec)
INFO:tensorflow:global_step/sec: 12.5754
INFO:tensorflow:loss = 1.2424177, step = 199800 (7.951 sec)
INFO:tensorflow:lr = 5.36998e-05 (7.952 sec)
INFO:tensorflow:global_step/sec: 12.7417
INFO:tensorflow:loss = 1.2406178, step = 199900 (7.850 sec)
INFO:tensorflow:lr = 5.3645854e-05 (7.849 sec)
INFO:tensorflow:global_step/sec: 12.8213
INFO:tensorflow:loss = 1.24702, step = 200000 (7.796 sec)
INFO:tensorflow:lr = 5.3591964e-05 (7.798 sec)
INFO:tensorflow:global_step/sec: 12.8796
INFO:tensorflow:loss = 1.2420019, step = 200100 (7.768 sec)
INFO:tensorflow:lr = 5.353813e-05 (7.768 sec)
INFO:tensorflow:global_step/sec: 12.8989
INFO:tensorflow:loss = 1.242649, step = 200200 (7.758 sec)
INFO:tensorflow:lr = 5.348435e-05 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.8297
INFO:tensorflow:loss = 1.2412878, step = 200300 (7.793 sec)
INFO:tensorflow:lr = 5.3430627e-05 (7.793 sec)
INFO:tensorflow:global_step/sec: 12.7035
INFO:tensorflow:loss = 1.2421048, step = 200400 (7.865 sec)
INFO:tensorflow:lr = 5.3376953e-05 (7.868 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.50905
INFO:tensorflow:loss = 1.2434052, step = 200500 (11.754 sec)
INFO:tensorflow:lr = 5.332333e-05 (11.750 sec)
INFO:tensorflow:global_step/sec: 12.6036
INFO:tensorflow:loss = 1.2436012, step = 200600 (7.937 sec)
INFO:tensorflow:lr = 5.3269774e-05 (7.938 sec)
INFO:tensorflow:global_step/sec: 12.8985
INFO:tensorflow:loss = 1.2408528, step = 200700 (7.749 sec)
INFO:tensorflow:lr = 5.321626e-05 (7.748 sec)
INFO:tensorflow:global_step/sec: 12.7336
INFO:tensorflow:loss = 1.2421123, step = 200800 (7.852 sec)
INFO:tensorflow:lr = 5.316281e-05 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.9262
INFO:tensorflow:loss = 1.242066, step = 200900 (7.738 sec)
INFO:tensorflow:lr = 5.31094e-05 (7.742 sec)
INFO:tensorflow:global_step/sec: 12.5781
INFO:tensorflow:loss = 1.2408648, step = 201000 (7.954 sec)
INFO:tensorflow:lr = 5.3056046e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 12.7527
INFO:tensorflow:loss = 1.2473798, step = 201100 (7.837 sec)
INFO:tensorflow:lr = 5.3002754e-05 (7.843 sec)
INFO:tensorflow:global_step/sec: 12.9835
INFO:tensorflow:loss = 1.2424769, step = 201200 (7.708 sec)
INFO:tensorflow:lr = 5.2949512e-05 (7.702 sec)
INFO:tensorflow:global_step/sec: 12.631
INFO:tensorflow:loss = 1.2482032, step = 201300 (7.916 sec)
INFO:tensorflow:lr = 5.2896325e-05 (7.915 sec)
INFO:tensorflow:global_step/sec: 12.6894
INFO:tensorflow:loss = 1.2401179, step = 201400 (7.875 sec)
INFO:tensorflow:lr = 5.284318e-05 (7.879 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.22447
INFO:tensorflow:loss = 1.2414714, step = 201500 (10.842 sec)
INFO:tensorflow:lr = 5.27901e-05 (10.838 sec)
INFO:tensorflow:global_step/sec: 12.8635
INFO:tensorflow:loss = 1.2402923, step = 201600 (7.779 sec)
INFO:tensorflow:lr = 5.2737072e-05 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.6169
INFO:tensorflow:loss = 1.2466598, step = 201700 (7.922 sec)
INFO:tensorflow:lr = 5.2684096e-05 (7.924 sec)
INFO:tensorflow:global_step/sec: 12.8282
INFO:tensorflow:loss = 1.2450514, step = 201800 (7.798 sec)
INFO:tensorflow:lr = 5.2631174e-05 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.8332
INFO:tensorflow:loss = 1.2427869, step = 201900 (7.791 sec)
INFO:tensorflow:lr = 5.2578303e-05 (7.792 sec)
INFO:tensorflow:global_step/sec: 12.8144
INFO:tensorflow:loss = 1.2411528, step = 202000 (7.804 sec)
INFO:tensorflow:lr = 5.2525484e-05 (7.805 sec)
INFO:tensorflow:global_step/sec: 12.8084
INFO:tensorflow:loss = 1.2449394, step = 202100 (7.808 sec)
INFO:tensorflow:lr = 5.2472726e-05 (7.806 sec)
INFO:tensorflow:global_step/sec: 12.7354
INFO:tensorflow:loss = 1.243877, step = 202200 (7.847 sec)
INFO:tensorflow:lr = 5.2420008e-05 (7.851 sec)
INFO:tensorflow:global_step/sec: 12.7724
INFO:tensorflow:loss = 1.243457, step = 202300 (7.833 sec)
INFO:tensorflow:lr = 5.236736e-05 (7.829 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0221
INFO:tensorflow:loss = 1.2485676, step = 202400 (8.321 sec)
INFO:tensorflow:lr = 5.231475e-05 (8.321 sec)
INFO:tensorflow:global_step/sec: 10.6252
INFO:tensorflow:loss = 1.2417319, step = 202500 (9.409 sec)
INFO:tensorflow:lr = 5.2262196e-05 (9.409 sec)
INFO:tensorflow:global_step/sec: 12.5426
INFO:tensorflow:loss = 1.2401463, step = 202600 (7.973 sec)
INFO:tensorflow:lr = 5.2209703e-05 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.6906
INFO:tensorflow:loss = 1.2469463, step = 202700 (7.881 sec)
INFO:tensorflow:lr = 5.215725e-05 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.7801
INFO:tensorflow:loss = 1.2424095, step = 202800 (7.823 sec)
INFO:tensorflow:lr = 5.2104864e-05 (7.824 sec)
INFO:tensorflow:global_step/sec: 12.8786
INFO:tensorflow:loss = 1.2429019, step = 202900 (7.765 sec)
INFO:tensorflow:lr = 5.205252e-05 (7.764 sec)
INFO:tensorflow:global_step/sec: 12.5697
INFO:tensorflow:loss = 1.2409177, step = 203000 (7.951 sec)
INFO:tensorflow:lr = 5.200023e-05 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.8791
INFO:tensorflow:loss = 1.2402259, step = 203100 (7.771 sec)
INFO:tensorflow:lr = 5.1948005e-05 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.87
INFO:tensorflow:loss = 1.2429622, step = 203200 (7.764 sec)
INFO:tensorflow:lr = 5.1895815e-05 (7.769 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.8056
INFO:tensorflow:loss = 1.2428799, step = 203300 (7.810 sec)
INFO:tensorflow:lr = 5.1843683e-05 (7.807 sec)
INFO:tensorflow:global_step/sec: 11.0626
INFO:tensorflow:loss = 1.2453337, step = 203400 (9.044 sec)
INFO:tensorflow:lr = 5.179161e-05 (9.044 sec)
INFO:tensorflow:global_step/sec: 12.7831
INFO:tensorflow:loss = 1.2423886, step = 203500 (7.823 sec)
INFO:tensorflow:lr = 5.173957e-05 (7.821 sec)
INFO:tensorflow:global_step/sec: 12.9267
INFO:tensorflow:loss = 1.2417992, step = 203600 (7.734 sec)
INFO:tensorflow:lr = 5.1687603e-05 (7.734 sec)
INFO:tensorflow:global_step/sec: 12.8584
INFO:tensorflow:loss = 1.2422185, step = 203700 (7.774 sec)
INFO:tensorflow:lr = 5.163568e-05 (7.774 sec)
INFO:tensorflow:global_step/sec: 12.9589
INFO:tensorflow:loss = 1.2430236, step = 203800 (7.721 sec)
INFO:tensorflow:lr = 5.1583815e-05 (7.722 sec)
INFO:tensorflow:global_step/sec: 13.0881
INFO:tensorflow:loss = 1.2422028, step = 203900 (7.641 sec)
INFO:tensorflow:lr = 5.1532e-05 (7.640 sec)
INFO:tensorflow:global_step/sec: 12.7424
INFO:tensorflow:loss = 1.244065, step = 204000 (7.842 sec)
INFO:tensorflow:lr = 5.1480227e-05 (7.842 sec)
INFO:tensorflow:global_step/sec: 12.5838
INFO:tensorflow:loss = 1.2406197, step = 204100 (7.949 sec)
INFO:tensorflow:lr = 5.142852e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 13.0673
INFO:tensorflow:loss = 1.2419794, step = 204200 (7.653 sec)
INFO:tensorflow:lr = 5.1376854e-05 (7.653 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.8192
INFO:tensorflow:loss = 1.2445016, step = 204300 (8.465 sec)
INFO:tensorflow:lr = 5.132525e-05 (8.469 sec)
INFO:tensorflow:global_step/sec: 11.1892
INFO:tensorflow:loss = 1.2439507, step = 204400 (8.934 sec)
INFO:tensorflow:lr = 5.127369e-05 (8.931 sec)
INFO:tensorflow:global_step/sec: 12.8959
INFO:tensorflow:loss = 1.2410576, step = 204500 (7.754 sec)
INFO:tensorflow:lr = 5.122218e-05 (7.753 sec)
INFO:tensorflow:global_step/sec: 12.7912
INFO:tensorflow:loss = 1.2469463, step = 204600 (7.819 sec)
INFO:tensorflow:lr = 5.117073e-05 (7.819 sec)
INFO:tensorflow:global_step/sec: 12.7463
INFO:tensorflow:loss = 1.2434845, step = 204700 (7.843 sec)
INFO:tensorflow:lr = 5.1119325e-05 (7.842 sec)
INFO:tensorflow:global_step/sec: 12.874
INFO:tensorflow:loss = 1.2412622, step = 204800 (7.767 sec)
INFO:tensorflow:lr = 5.1067982e-05 (7.772 sec)
INFO:tensorflow:global_step/sec: 12.964
INFO:tensorflow:loss = 1.2421836, step = 204900 (7.714 sec)
INFO:tensorflow:lr = 5.1016676e-05 (7.708 sec)
INFO:tensorflow:global_step/sec: 12.9155
INFO:tensorflow:loss = 1.2425599, step = 205000 (7.746 sec)
INFO:tensorflow:lr = 5.0965427e-05 (7.747 sec)
INFO:tensorflow:global_step/sec: 12.5868
INFO:tensorflow:loss = 1.2451409, step = 205100 (7.941 sec)
INFO:tensorflow:lr = 5.0914234e-05 (7.941 sec)
INFO:tensorflow:global_step/sec: 12.7319
INFO:tensorflow:loss = 1.2429577, step = 205200 (7.858 sec)
INFO:tensorflow:lr = 5.0863087e-05 (7.859 sec)
INFO:tensorflow:global_step/sec: 12.7461
INFO:tensorflow:loss = 1.2407069, step = 205300 (7.842 sec)
INFO:tensorflow:lr = 5.0812e-05 (7.844 sec)
INFO:tensorflow:Saving checkpoints for 205380 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2441876.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-205380
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-205380
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.729
INFO:tensorflow:Best (Exact Match) Accuracy: 0.733
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-205380
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 205380 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2418262, step = 205380
INFO:tensorflow:lr = 5.077116e-05
INFO:tensorflow:global_step/sec: 10.4309
INFO:tensorflow:loss = 1.243347, step = 205480 (9.594 sec)
INFO:tensorflow:lr = 5.0720155e-05 (9.593 sec)
INFO:tensorflow:global_step/sec: 12.4196
INFO:tensorflow:loss = 1.2491117, step = 205580 (8.050 sec)
INFO:tensorflow:lr = 5.0669198e-05 (8.046 sec)
INFO:tensorflow:global_step/sec: 12.5694
INFO:tensorflow:loss = 1.2417834, step = 205680 (7.960 sec)
INFO:tensorflow:lr = 5.0618306e-05 (7.960 sec)
INFO:tensorflow:global_step/sec: 12.727
INFO:tensorflow:loss = 1.2427137, step = 205780 (7.854 sec)
INFO:tensorflow:lr = 5.0567458e-05 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.9172
INFO:tensorflow:loss = 1.2439225, step = 205880 (7.743 sec)
INFO:tensorflow:lr = 5.0516664e-05 (7.742 sec)
INFO:tensorflow:global_step/sec: 12.8616
INFO:tensorflow:loss = 1.2396872, step = 205980 (7.769 sec)
INFO:tensorflow:lr = 5.0465915e-05 (7.769 sec)
INFO:tensorflow:global_step/sec: 12.8284
INFO:tensorflow:loss = 1.2469605, step = 206080 (7.800 sec)
INFO:tensorflow:lr = 5.0415223e-05 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.9143
INFO:tensorflow:loss = 1.2422843, step = 206180 (7.743 sec)
INFO:tensorflow:lr = 5.0364582e-05 (7.745 sec)
INFO:tensorflow:global_step/sec: 12.8145
INFO:tensorflow:loss = 1.2406392, step = 206280 (7.799 sec)
INFO:tensorflow:lr = 5.031399e-05 (7.798 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.21253
INFO:tensorflow:loss = 1.2431515, step = 206380 (12.183 sec)
INFO:tensorflow:lr = 5.026345e-05 (12.182 sec)
INFO:tensorflow:global_step/sec: 12.6628
INFO:tensorflow:loss = 1.2423357, step = 206480 (7.895 sec)
INFO:tensorflow:lr = 5.0212955e-05 (7.895 sec)
INFO:tensorflow:global_step/sec: 12.9072
INFO:tensorflow:loss = 1.2458041, step = 206580 (7.750 sec)
INFO:tensorflow:lr = 5.016251e-05 (7.752 sec)
INFO:tensorflow:global_step/sec: 12.6023
INFO:tensorflow:loss = 1.2403214, step = 206680 (7.929 sec)
INFO:tensorflow:lr = 5.011213e-05 (7.927 sec)
INFO:tensorflow:global_step/sec: 12.7342
INFO:tensorflow:loss = 1.24217, step = 206780 (7.857 sec)
INFO:tensorflow:lr = 5.006179e-05 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.8234
INFO:tensorflow:loss = 1.2415317, step = 206880 (7.800 sec)
INFO:tensorflow:lr = 5.0011495e-05 (7.799 sec)
INFO:tensorflow:global_step/sec: 12.7469
INFO:tensorflow:loss = 1.2417748, step = 206980 (7.845 sec)
INFO:tensorflow:lr = 4.9961258e-05 (7.845 sec)
INFO:tensorflow:global_step/sec: 12.7289
INFO:tensorflow:loss = 1.2420164, step = 207080 (7.855 sec)
INFO:tensorflow:lr = 4.991107e-05 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.216
INFO:tensorflow:loss = 1.242654, step = 207180 (8.184 sec)
INFO:tensorflow:lr = 4.9860933e-05 (8.184 sec)
INFO:tensorflow:global_step/sec: 13.0354
INFO:tensorflow:loss = 1.241695, step = 207280 (7.668 sec)
INFO:tensorflow:lr = 4.9810842e-05 (7.668 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.23015
INFO:tensorflow:loss = 1.2435169, step = 207380 (12.156 sec)
INFO:tensorflow:lr = 4.9760813e-05 (12.156 sec)
INFO:tensorflow:global_step/sec: 12.9586
INFO:tensorflow:loss = 1.2414528, step = 207480 (7.718 sec)
INFO:tensorflow:lr = 4.9710827e-05 (7.718 sec)
INFO:tensorflow:global_step/sec: 12.6373
INFO:tensorflow:loss = 1.2421968, step = 207580 (7.911 sec)
INFO:tensorflow:lr = 4.9660885e-05 (7.912 sec)
INFO:tensorflow:global_step/sec: 12.6402
INFO:tensorflow:loss = 1.2409348, step = 207680 (7.906 sec)
INFO:tensorflow:lr = 4.9611004e-05 (7.906 sec)
INFO:tensorflow:global_step/sec: 12.7392
INFO:tensorflow:loss = 1.2412691, step = 207780 (7.854 sec)
INFO:tensorflow:lr = 4.9561164e-05 (7.854 sec)
INFO:tensorflow:global_step/sec: 12.943
INFO:tensorflow:loss = 1.244255, step = 207880 (7.722 sec)
INFO:tensorflow:lr = 4.9511385e-05 (7.725 sec)
INFO:tensorflow:global_step/sec: 12.7753
INFO:tensorflow:loss = 1.2425479, step = 207980 (7.832 sec)
INFO:tensorflow:lr = 4.9461647e-05 (7.829 sec)
INFO:tensorflow:global_step/sec: 12.9729
INFO:tensorflow:loss = 1.2428502, step = 208080 (7.704 sec)
INFO:tensorflow:lr = 4.9411956e-05 (7.704 sec)
INFO:tensorflow:global_step/sec: 12.7115
INFO:tensorflow:loss = 1.2472405, step = 208180 (7.868 sec)
INFO:tensorflow:lr = 4.9362327e-05 (7.868 sec)
INFO:tensorflow:global_step/sec: 12.7367
INFO:tensorflow:loss = 1.2415825, step = 208280 (7.851 sec)
INFO:tensorflow:lr = 4.931274e-05 (7.851 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.47069
INFO:tensorflow:loss = 1.2403713, step = 208380 (11.811 sec)
INFO:tensorflow:lr = 4.9263206e-05 (11.811 sec)
INFO:tensorflow:global_step/sec: 12.6213
INFO:tensorflow:loss = 1.2408, step = 208480 (7.922 sec)
INFO:tensorflow:lr = 4.921372e-05 (7.921 sec)
INFO:tensorflow:global_step/sec: 12.8692
INFO:tensorflow:loss = 1.2405838, step = 208580 (7.770 sec)
INFO:tensorflow:lr = 4.9164275e-05 (7.770 sec)
INFO:tensorflow:global_step/sec: 12.9359
INFO:tensorflow:loss = 1.2444116, step = 208680 (7.726 sec)
INFO:tensorflow:lr = 4.9114893e-05 (7.726 sec)
INFO:tensorflow:global_step/sec: 12.8071
INFO:tensorflow:loss = 1.2422515, step = 208780 (7.808 sec)
INFO:tensorflow:lr = 4.906555e-05 (7.812 sec)
INFO:tensorflow:global_step/sec: 12.4937
INFO:tensorflow:loss = 1.240635, step = 208880 (8.004 sec)
INFO:tensorflow:lr = 4.9016267e-05 (8.001 sec)
INFO:tensorflow:global_step/sec: 12.9984
INFO:tensorflow:loss = 1.2395564, step = 208980 (7.698 sec)
INFO:tensorflow:lr = 4.896703e-05 (7.696 sec)
INFO:tensorflow:global_step/sec: 12.6199
INFO:tensorflow:loss = 1.2414572, step = 209080 (7.924 sec)
INFO:tensorflow:lr = 4.8917842e-05 (7.925 sec)
INFO:tensorflow:global_step/sec: 12.6925
INFO:tensorflow:loss = 1.2428277, step = 209180 (7.880 sec)
INFO:tensorflow:lr = 4.8868704e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.7822
INFO:tensorflow:loss = 1.2430718, step = 209280 (7.825 sec)
INFO:tensorflow:lr = 4.8819613e-05 (7.825 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.37639
INFO:tensorflow:loss = 1.2407434, step = 209380 (11.932 sec)
INFO:tensorflow:lr = 4.8770577e-05 (11.932 sec)
INFO:tensorflow:global_step/sec: 12.6544
INFO:tensorflow:loss = 1.2410898, step = 209480 (7.902 sec)
INFO:tensorflow:lr = 4.8721577e-05 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.7381
INFO:tensorflow:loss = 1.2487592, step = 209580 (7.856 sec)
INFO:tensorflow:lr = 4.8672635e-05 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.5663
INFO:tensorflow:loss = 1.2414043, step = 209680 (7.959 sec)
INFO:tensorflow:lr = 4.8623744e-05 (7.960 sec)
INFO:tensorflow:global_step/sec: 12.5939
INFO:tensorflow:loss = 1.2406616, step = 209780 (7.936 sec)
INFO:tensorflow:lr = 4.85749e-05 (7.935 sec)
INFO:tensorflow:global_step/sec: 12.5459
INFO:tensorflow:loss = 1.2446214, step = 209880 (7.970 sec)
INFO:tensorflow:lr = 4.852611e-05 (7.971 sec)
INFO:tensorflow:global_step/sec: 12.5481
INFO:tensorflow:loss = 1.2434163, step = 209980 (7.968 sec)
INFO:tensorflow:lr = 4.8477363e-05 (7.968 sec)
INFO:tensorflow:global_step/sec: 12.76
INFO:tensorflow:loss = 1.2430301, step = 210080 (7.837 sec)
INFO:tensorflow:lr = 4.842866e-05 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.5294
INFO:tensorflow:loss = 1.2408226, step = 210180 (7.987 sec)
INFO:tensorflow:lr = 4.8380018e-05 (7.987 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.5734
INFO:tensorflow:loss = 1.2454717, step = 210280 (11.673 sec)
INFO:tensorflow:lr = 4.8331414e-05 (11.673 sec)
INFO:tensorflow:global_step/sec: 12.6821
INFO:tensorflow:loss = 1.2445272, step = 210380 (7.877 sec)
INFO:tensorflow:lr = 4.828287e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.5257
INFO:tensorflow:loss = 1.2420585, step = 210480 (7.977 sec)
INFO:tensorflow:lr = 4.8234368e-05 (7.976 sec)
INFO:tensorflow:global_step/sec: 12.6337
INFO:tensorflow:loss = 1.2436208, step = 210580 (7.915 sec)
INFO:tensorflow:lr = 4.818591e-05 (7.915 sec)
INFO:tensorflow:global_step/sec: 12.8119
INFO:tensorflow:loss = 1.2423323, step = 210680 (7.811 sec)
INFO:tensorflow:lr = 4.813751e-05 (7.810 sec)
INFO:tensorflow:global_step/sec: 12.4684
INFO:tensorflow:loss = 1.2410481, step = 210780 (8.018 sec)
INFO:tensorflow:lr = 4.808915e-05 (8.018 sec)
INFO:tensorflow:global_step/sec: 12.8201
INFO:tensorflow:loss = 1.2407342, step = 210880 (7.797 sec)
INFO:tensorflow:lr = 4.804085e-05 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.5921
INFO:tensorflow:loss = 1.2401924, step = 210980 (7.944 sec)
INFO:tensorflow:lr = 4.7992587e-05 (7.945 sec)
INFO:tensorflow:global_step/sec: 12.7187
INFO:tensorflow:loss = 1.2426429, step = 211080 (7.862 sec)
INFO:tensorflow:lr = 4.7944373e-05 (7.862 sec)
INFO:tensorflow:global_step/sec: 12.6319
INFO:tensorflow:loss = 1.2419528, step = 211180 (7.915 sec)
INFO:tensorflow:lr = 4.7896217e-05 (7.915 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.23778
INFO:tensorflow:loss = 1.2429737, step = 211280 (10.830 sec)
INFO:tensorflow:lr = 4.7848105e-05 (10.831 sec)
INFO:tensorflow:global_step/sec: 12.8513
INFO:tensorflow:loss = 1.2444791, step = 211380 (7.780 sec)
INFO:tensorflow:lr = 4.7800044e-05 (7.780 sec)
INFO:tensorflow:global_step/sec: 12.8092
INFO:tensorflow:loss = 1.2424067, step = 211480 (7.810 sec)
INFO:tensorflow:lr = 4.7752023e-05 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.8037
INFO:tensorflow:loss = 1.2412364, step = 211580 (7.805 sec)
INFO:tensorflow:lr = 4.770405e-05 (7.809 sec)
INFO:tensorflow:global_step/sec: 12.5397
INFO:tensorflow:loss = 1.2432137, step = 211680 (7.979 sec)
INFO:tensorflow:lr = 4.7656133e-05 (7.975 sec)
INFO:tensorflow:global_step/sec: 13.0206
INFO:tensorflow:loss = 1.2420354, step = 211780 (7.676 sec)
INFO:tensorflow:lr = 4.760826e-05 (7.677 sec)
INFO:tensorflow:global_step/sec: 12.9015
INFO:tensorflow:loss = 1.2408917, step = 211880 (7.751 sec)
INFO:tensorflow:lr = 4.7560436e-05 (7.751 sec)
INFO:tensorflow:global_step/sec: 12.671
INFO:tensorflow:loss = 1.24008, step = 211980 (7.889 sec)
INFO:tensorflow:lr = 4.751266e-05 (7.889 sec)
INFO:tensorflow:global_step/sec: 12.6053
INFO:tensorflow:loss = 1.2407787, step = 212080 (7.933 sec)
INFO:tensorflow:lr = 4.746493e-05 (7.933 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1759
INFO:tensorflow:loss = 1.240133, step = 212180 (8.213 sec)
INFO:tensorflow:lr = 4.7417256e-05 (8.220 sec)
INFO:tensorflow:global_step/sec: 10.5411
INFO:tensorflow:loss = 1.242667, step = 212280 (9.488 sec)
INFO:tensorflow:lr = 4.7369624e-05 (9.481 sec)
INFO:tensorflow:global_step/sec: 12.9632
INFO:tensorflow:loss = 1.2408278, step = 212380 (7.713 sec)
INFO:tensorflow:lr = 4.732204e-05 (7.718 sec)
INFO:tensorflow:global_step/sec: 12.693
INFO:tensorflow:loss = 1.2441196, step = 212480 (7.878 sec)
INFO:tensorflow:lr = 4.7274498e-05 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.7106
INFO:tensorflow:loss = 1.242603, step = 212580 (7.874 sec)
INFO:tensorflow:lr = 4.722701e-05 (7.873 sec)
INFO:tensorflow:global_step/sec: 12.5065
INFO:tensorflow:loss = 1.2410915, step = 212680 (7.990 sec)
INFO:tensorflow:lr = 4.7179576e-05 (7.991 sec)
INFO:tensorflow:global_step/sec: 12.6562
INFO:tensorflow:loss = 1.2419416, step = 212780 (7.907 sec)
INFO:tensorflow:lr = 4.7132176e-05 (7.906 sec)
INFO:tensorflow:global_step/sec: 12.3483
INFO:tensorflow:loss = 1.2452627, step = 212880 (8.097 sec)
INFO:tensorflow:lr = 4.708484e-05 (8.097 sec)
INFO:tensorflow:global_step/sec: 12.5276
INFO:tensorflow:loss = 1.2399526, step = 212980 (7.982 sec)
INFO:tensorflow:lr = 4.7037538e-05 (7.982 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.5239
INFO:tensorflow:loss = 1.2448621, step = 213080 (7.982 sec)
INFO:tensorflow:lr = 4.6990284e-05 (7.982 sec)
INFO:tensorflow:global_step/sec: 10.8555
INFO:tensorflow:loss = 1.2401872, step = 213180 (9.216 sec)
INFO:tensorflow:lr = 4.6943085e-05 (9.216 sec)
INFO:tensorflow:global_step/sec: 12.6474
INFO:tensorflow:loss = 1.2426721, step = 213280 (7.907 sec)
INFO:tensorflow:lr = 4.6895926e-05 (7.907 sec)
INFO:tensorflow:global_step/sec: 13.0417
INFO:tensorflow:loss = 1.2432199, step = 213380 (7.663 sec)
INFO:tensorflow:lr = 4.684882e-05 (7.665 sec)
INFO:tensorflow:global_step/sec: 12.7907
INFO:tensorflow:loss = 1.2436359, step = 213480 (7.821 sec)
INFO:tensorflow:lr = 4.6801757e-05 (7.820 sec)
INFO:tensorflow:global_step/sec: 12.6265
INFO:tensorflow:loss = 1.239592, step = 213580 (7.915 sec)
INFO:tensorflow:lr = 4.6754736e-05 (7.915 sec)
INFO:tensorflow:global_step/sec: 11.9851
INFO:tensorflow:loss = 1.2443177, step = 213680 (8.343 sec)
INFO:tensorflow:lr = 4.6707773e-05 (8.343 sec)
INFO:tensorflow:global_step/sec: 12.5796
INFO:tensorflow:loss = 1.2432239, step = 213780 (7.951 sec)
INFO:tensorflow:lr = 4.666086e-05 (7.951 sec)
INFO:tensorflow:global_step/sec: 12.4314
INFO:tensorflow:loss = 1.2420282, step = 213880 (8.047 sec)
INFO:tensorflow:lr = 4.661399e-05 (8.047 sec)
INFO:tensorflow:global_step/sec: 12.4872
INFO:tensorflow:loss = 1.2413042, step = 213980 (8.008 sec)
INFO:tensorflow:lr = 4.6567162e-05 (8.007 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.6035
INFO:tensorflow:loss = 1.2453946, step = 214080 (8.632 sec)
INFO:tensorflow:lr = 4.6520378e-05 (8.633 sec)
INFO:tensorflow:global_step/sec: 11.1427
INFO:tensorflow:loss = 1.241159, step = 214180 (8.963 sec)
INFO:tensorflow:lr = 4.647365e-05 (8.962 sec)
INFO:tensorflow:global_step/sec: 12.6876
INFO:tensorflow:loss = 1.240063, step = 214280 (7.880 sec)
INFO:tensorflow:lr = 4.642696e-05 (7.881 sec)
INFO:tensorflow:global_step/sec: 12.1038
INFO:tensorflow:loss = 1.2410262, step = 214380 (8.263 sec)
INFO:tensorflow:lr = 4.638033e-05 (8.263 sec)
INFO:tensorflow:global_step/sec: 12.6095
INFO:tensorflow:loss = 1.2421927, step = 214480 (7.929 sec)
INFO:tensorflow:lr = 4.6333746e-05 (7.932 sec)
INFO:tensorflow:global_step/sec: 12.2797
INFO:tensorflow:loss = 1.2429354, step = 214580 (8.144 sec)
INFO:tensorflow:lr = 4.6287194e-05 (8.142 sec)
INFO:tensorflow:global_step/sec: 12.4471
INFO:tensorflow:loss = 1.2444017, step = 214680 (8.029 sec)
INFO:tensorflow:lr = 4.6240704e-05 (8.028 sec)
INFO:tensorflow:global_step/sec: 12.5796
INFO:tensorflow:loss = 1.2418594, step = 214780 (7.949 sec)
INFO:tensorflow:lr = 4.6194247e-05 (7.953 sec)
INFO:tensorflow:global_step/sec: 12.1706
INFO:tensorflow:loss = 1.2411361, step = 214880 (8.217 sec)
INFO:tensorflow:lr = 4.614785e-05 (8.213 sec)
INFO:tensorflow:global_step/sec: 12.3648
INFO:tensorflow:loss = 1.2421589, step = 214980 (8.087 sec)
INFO:tensorflow:lr = 4.610149e-05 (8.087 sec)
INFO:tensorflow:global_step/sec: 12.6355
INFO:tensorflow:loss = 1.240195, step = 215080 (7.914 sec)
INFO:tensorflow:lr = 4.605517e-05 (7.915 sec)
INFO:tensorflow:Saving checkpoints for 215160 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2434119.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-215160
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-215160
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.731
INFO:tensorflow:Best (Exact Match) Accuracy: 0.733
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-215160
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 215160 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.2435311, step = 215160
INFO:tensorflow:lr = 4.601817e-05
INFO:tensorflow:global_step/sec: 9.90966
INFO:tensorflow:loss = 1.242061, step = 215260 (10.099 sec)
INFO:tensorflow:lr = 4.5971938e-05 (10.099 sec)
INFO:tensorflow:global_step/sec: 12.3753
INFO:tensorflow:loss = 1.2418321, step = 215360 (8.078 sec)
INFO:tensorflow:lr = 4.5925754e-05 (8.078 sec)
INFO:tensorflow:global_step/sec: 12.8241
INFO:tensorflow:loss = 1.2416762, step = 215460 (7.797 sec)
INFO:tensorflow:lr = 4.5879624e-05 (7.796 sec)
INFO:tensorflow:global_step/sec: 12.4313
INFO:tensorflow:loss = 1.2419561, step = 215560 (8.047 sec)
INFO:tensorflow:lr = 4.5833534e-05 (8.047 sec)
INFO:tensorflow:global_step/sec: 12.3863
INFO:tensorflow:loss = 1.2430488, step = 215660 (8.068 sec)
INFO:tensorflow:lr = 4.5787496e-05 (8.068 sec)
INFO:tensorflow:global_step/sec: 12.0618
INFO:tensorflow:loss = 1.2430937, step = 215760 (8.296 sec)
INFO:tensorflow:lr = 4.5741504e-05 (8.295 sec)
INFO:tensorflow:global_step/sec: 12.3146
INFO:tensorflow:loss = 1.2398549, step = 215860 (8.119 sec)
INFO:tensorflow:lr = 4.569555e-05 (8.119 sec)
INFO:tensorflow:global_step/sec: 12.3494
INFO:tensorflow:loss = 1.2440462, step = 215960 (8.097 sec)
INFO:tensorflow:lr = 4.5649653e-05 (8.098 sec)
INFO:tensorflow:global_step/sec: 11.9267
INFO:tensorflow:loss = 1.242953, step = 216060 (8.387 sec)
INFO:tensorflow:lr = 4.5603792e-05 (8.386 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.87687
INFO:tensorflow:loss = 1.2415045, step = 216160 (12.694 sec)
INFO:tensorflow:lr = 4.5557987e-05 (12.695 sec)
INFO:tensorflow:global_step/sec: 12.3866
INFO:tensorflow:loss = 1.2421069, step = 216260 (8.074 sec)
INFO:tensorflow:lr = 4.551222e-05 (8.073 sec)
INFO:tensorflow:global_step/sec: 12.3103
INFO:tensorflow:loss = 1.2413859, step = 216360 (8.119 sec)
INFO:tensorflow:lr = 4.54665e-05 (8.119 sec)
INFO:tensorflow:global_step/sec: 12.2992
INFO:tensorflow:loss = 1.2421327, step = 216460 (8.135 sec)
INFO:tensorflow:lr = 4.542083e-05 (8.135 sec)
INFO:tensorflow:global_step/sec: 12.0773
INFO:tensorflow:loss = 1.2416039, step = 216560 (8.275 sec)
INFO:tensorflow:lr = 4.5375204e-05 (8.276 sec)
INFO:tensorflow:global_step/sec: 12.3892
INFO:tensorflow:loss = 1.240614, step = 216660 (8.071 sec)
INFO:tensorflow:lr = 4.5329627e-05 (8.070 sec)
INFO:tensorflow:global_step/sec: 12.207
INFO:tensorflow:loss = 1.2392285, step = 216760 (8.192 sec)
INFO:tensorflow:lr = 4.5284087e-05 (8.192 sec)
INFO:tensorflow:global_step/sec: 12.5466
INFO:tensorflow:loss = 1.2417903, step = 216860 (7.970 sec)
INFO:tensorflow:lr = 4.5238594e-05 (7.970 sec)
INFO:tensorflow:global_step/sec: 12.5423
INFO:tensorflow:loss = 1.2406605, step = 216960 (7.978 sec)
INFO:tensorflow:lr = 4.5193156e-05 (7.978 sec)
INFO:tensorflow:global_step/sec: 12.2379
INFO:tensorflow:loss = 1.2422897, step = 217060 (8.168 sec)
INFO:tensorflow:lr = 4.5147754e-05 (8.168 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.96771
INFO:tensorflow:loss = 1.2423333, step = 217160 (12.550 sec)
INFO:tensorflow:lr = 4.5102406e-05 (12.552 sec)
INFO:tensorflow:global_step/sec: 12.0423
INFO:tensorflow:loss = 1.2417514, step = 217260 (8.305 sec)
INFO:tensorflow:lr = 4.5057095e-05 (8.306 sec)
INFO:tensorflow:global_step/sec: 12.3714
INFO:tensorflow:loss = 1.2436274, step = 217360 (8.085 sec)
INFO:tensorflow:lr = 4.5011835e-05 (8.092 sec)
INFO:tensorflow:global_step/sec: 12.0762
INFO:tensorflow:loss = 1.2410803, step = 217460 (8.278 sec)
INFO:tensorflow:lr = 4.4966622e-05 (8.273 sec)
INFO:tensorflow:global_step/sec: 12.4341
INFO:tensorflow:loss = 1.2418171, step = 217560 (8.047 sec)
INFO:tensorflow:lr = 4.492145e-05 (8.045 sec)
INFO:tensorflow:global_step/sec: 12.1051
INFO:tensorflow:loss = 1.2409146, step = 217660 (8.255 sec)
INFO:tensorflow:lr = 4.487633e-05 (8.257 sec)
INFO:tensorflow:global_step/sec: 12.5272
INFO:tensorflow:loss = 1.241607, step = 217760 (7.989 sec)
INFO:tensorflow:lr = 4.483125e-05 (7.986 sec)
INFO:tensorflow:global_step/sec: 12.4025
INFO:tensorflow:loss = 1.241136, step = 217860 (8.062 sec)
INFO:tensorflow:lr = 4.478621e-05 (8.062 sec)
INFO:tensorflow:global_step/sec: 12.2296
INFO:tensorflow:loss = 1.2414784, step = 217960 (8.176 sec)
INFO:tensorflow:lr = 4.4741224e-05 (8.176 sec)
INFO:tensorflow:global_step/sec: 12.5104
INFO:tensorflow:loss = 1.2465246, step = 218060 (7.991 sec)
INFO:tensorflow:lr = 4.469628e-05 (7.992 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 7.8534
INFO:tensorflow:loss = 1.2407348, step = 218160 (12.731 sec)
INFO:tensorflow:lr = 4.4651384e-05 (12.732 sec)
INFO:tensorflow:global_step/sec: 12.3249
INFO:tensorflow:loss = 1.2407353, step = 218260 (8.115 sec)
INFO:tensorflow:lr = 4.4606528e-05 (8.114 sec)
INFO:tensorflow:global_step/sec: 12.4159
INFO:tensorflow:loss = 1.2420832, step = 218360 (8.053 sec)
INFO:tensorflow:lr = 4.456172e-05 (8.051 sec)
INFO:tensorflow:global_step/sec: 11.9979
INFO:tensorflow:loss = 1.2450037, step = 218460 (8.334 sec)
INFO:tensorflow:lr = 4.4516957e-05 (8.334 sec)
INFO:tensorflow:global_step/sec: 12.2945
INFO:tensorflow:loss = 1.2435594, step = 218560 (8.134 sec)
INFO:tensorflow:lr = 4.447224e-05 (8.135 sec)
INFO:tensorflow:global_step/sec: 12.4887
INFO:tensorflow:loss = 1.2481513, step = 218660 (8.007 sec)
INFO:tensorflow:lr = 4.442757e-05 (8.006 sec)
INFO:tensorflow:global_step/sec: 12.5222
INFO:tensorflow:loss = 1.240262, step = 218760 (7.986 sec)
INFO:tensorflow:lr = 4.438293e-05 (7.986 sec)
INFO:tensorflow:global_step/sec: 12.325
INFO:tensorflow:loss = 1.2430587, step = 218860 (8.119 sec)
INFO:tensorflow:lr = 4.433835e-05 (8.120 sec)
INFO:tensorflow:global_step/sec: 12.7887
INFO:tensorflow:loss = 1.2427464, step = 218960 (7.821 sec)
INFO:tensorflow:lr = 4.4293814e-05 (7.822 sec)
INFO:tensorflow:global_step/sec: 12.9406
INFO:tensorflow:loss = 1.2418499, step = 219060 (7.726 sec)
INFO:tensorflow:lr = 4.4249315e-05 (7.724 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.25481
INFO:tensorflow:loss = 1.2473, step = 219160 (12.109 sec)
INFO:tensorflow:lr = 4.4204873e-05 (12.109 sec)
INFO:tensorflow:global_step/sec: 12.68
INFO:tensorflow:loss = 1.2424519, step = 219260 (7.891 sec)
INFO:tensorflow:lr = 4.4160464e-05 (7.892 sec)
INFO:tensorflow:global_step/sec: 12.6321
INFO:tensorflow:loss = 1.2408296, step = 219360 (7.917 sec)
INFO:tensorflow:lr = 4.4116096e-05 (7.916 sec)
INFO:tensorflow:global_step/sec: 12.2726
INFO:tensorflow:loss = 1.2401123, step = 219460 (8.148 sec)
INFO:tensorflow:lr = 4.4071785e-05 (8.148 sec)
INFO:tensorflow:global_step/sec: 12.3966
INFO:tensorflow:loss = 1.2420714, step = 219560 (8.068 sec)
INFO:tensorflow:lr = 4.4027514e-05 (8.068 sec)
INFO:tensorflow:global_step/sec: 12.2952
INFO:tensorflow:loss = 1.2455899, step = 219660 (8.133 sec)
INFO:tensorflow:lr = 4.398329e-05 (8.133 sec)
INFO:tensorflow:global_step/sec: 12.6129
INFO:tensorflow:loss = 1.2427148, step = 219760 (7.922 sec)
INFO:tensorflow:lr = 4.3939108e-05 (7.922 sec)
INFO:tensorflow:global_step/sec: 12.6133
INFO:tensorflow:loss = 1.2426178, step = 219860 (7.928 sec)
INFO:tensorflow:lr = 4.3894965e-05 (7.928 sec)
INFO:tensorflow:global_step/sec: 12.5467
INFO:tensorflow:loss = 1.241264, step = 219960 (7.974 sec)
INFO:tensorflow:lr = 4.3850876e-05 (7.975 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.39625
INFO:tensorflow:loss = 1.2407962, step = 220060 (11.908 sec)
INFO:tensorflow:lr = 4.3806824e-05 (11.909 sec)
INFO:tensorflow:global_step/sec: 12.6177
INFO:tensorflow:loss = 1.2421613, step = 220160 (7.926 sec)
INFO:tensorflow:lr = 4.3762822e-05 (7.926 sec)
INFO:tensorflow:global_step/sec: 12.7117
INFO:tensorflow:loss = 1.2414433, step = 220260 (7.866 sec)
INFO:tensorflow:lr = 4.3718857e-05 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.8279
INFO:tensorflow:loss = 1.2425734, step = 220360 (7.794 sec)
INFO:tensorflow:lr = 4.3674943e-05 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.2026
INFO:tensorflow:loss = 1.241693, step = 220460 (8.200 sec)
INFO:tensorflow:lr = 4.3631073e-05 (8.204 sec)
INFO:tensorflow:global_step/sec: 12.4323
INFO:tensorflow:loss = 1.2427572, step = 220560 (8.045 sec)
INFO:tensorflow:lr = 4.358724e-05 (8.040 sec)
INFO:tensorflow:global_step/sec: 12.5544
INFO:tensorflow:loss = 1.2428184, step = 220660 (7.962 sec)
INFO:tensorflow:lr = 4.354346e-05 (7.962 sec)
INFO:tensorflow:global_step/sec: 12.6407
INFO:tensorflow:loss = 1.2432847, step = 220760 (7.911 sec)
INFO:tensorflow:lr = 4.3499716e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.7519
INFO:tensorflow:loss = 1.2409394, step = 220860 (7.847 sec)
INFO:tensorflow:lr = 4.3456017e-05 (7.847 sec)
INFO:tensorflow:global_step/sec: 12.6855
INFO:tensorflow:loss = 1.2418656, step = 220960 (7.878 sec)
INFO:tensorflow:lr = 4.341237e-05 (7.880 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.12931
INFO:tensorflow:loss = 1.2419653, step = 221060 (10.956 sec)
INFO:tensorflow:lr = 4.3368756e-05 (10.957 sec)
INFO:tensorflow:global_step/sec: 12.8768
INFO:tensorflow:loss = 1.2422274, step = 221160 (7.761 sec)
INFO:tensorflow:lr = 4.33252e-05 (7.759 sec)
INFO:tensorflow:global_step/sec: 12.5233
INFO:tensorflow:loss = 1.239835, step = 221260 (7.985 sec)
INFO:tensorflow:lr = 4.3281674e-05 (7.990 sec)
INFO:tensorflow:global_step/sec: 12.6333
INFO:tensorflow:loss = 1.2409306, step = 221360 (7.917 sec)
INFO:tensorflow:lr = 4.323819e-05 (7.915 sec)
INFO:tensorflow:global_step/sec: 12.6529
INFO:tensorflow:loss = 1.2407382, step = 221460 (7.909 sec)
INFO:tensorflow:lr = 4.319476e-05 (7.906 sec)
INFO:tensorflow:global_step/sec: 12.6227
INFO:tensorflow:loss = 1.2425914, step = 221560 (7.920 sec)
INFO:tensorflow:lr = 4.315137e-05 (7.920 sec)
INFO:tensorflow:global_step/sec: 12.7449
INFO:tensorflow:loss = 1.2465827, step = 221660 (7.845 sec)
INFO:tensorflow:lr = 4.3108023e-05 (7.845 sec)
INFO:tensorflow:global_step/sec: 12.6797
INFO:tensorflow:loss = 1.2416872, step = 221760 (7.889 sec)
INFO:tensorflow:lr = 4.306472e-05 (7.890 sec)
INFO:tensorflow:global_step/sec: 12.721
INFO:tensorflow:loss = 1.2460314, step = 221860 (7.865 sec)
INFO:tensorflow:lr = 4.3021457e-05 (7.864 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.1301
INFO:tensorflow:loss = 1.2410057, step = 221960 (8.244 sec)
INFO:tensorflow:lr = 4.297825e-05 (8.245 sec)
INFO:tensorflow:global_step/sec: 10.8417
INFO:tensorflow:loss = 1.2405419, step = 222060 (9.219 sec)
INFO:tensorflow:lr = 4.293507e-05 (9.219 sec)
INFO:tensorflow:global_step/sec: 12.6896
INFO:tensorflow:loss = 1.2431215, step = 222160 (7.875 sec)
INFO:tensorflow:lr = 4.289194e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.6973
INFO:tensorflow:loss = 1.2419086, step = 222260 (7.876 sec)
INFO:tensorflow:lr = 4.2848853e-05 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.5823
INFO:tensorflow:loss = 1.2409471, step = 222360 (7.953 sec)
INFO:tensorflow:lr = 4.2805805e-05 (7.949 sec)
INFO:tensorflow:global_step/sec: 12.8736
INFO:tensorflow:loss = 1.2430838, step = 222460 (7.762 sec)
INFO:tensorflow:lr = 4.276281e-05 (7.765 sec)
INFO:tensorflow:global_step/sec: 12.5773
INFO:tensorflow:loss = 1.242637, step = 222560 (7.951 sec)
INFO:tensorflow:lr = 4.271985e-05 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.883
INFO:tensorflow:loss = 1.2404941, step = 222660 (7.768 sec)
INFO:tensorflow:lr = 4.2676944e-05 (7.767 sec)
INFO:tensorflow:global_step/sec: 12.8256
INFO:tensorflow:loss = 1.2423271, step = 222760 (7.791 sec)
INFO:tensorflow:lr = 4.263407e-05 (7.796 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.3713
INFO:tensorflow:loss = 1.2421962, step = 222860 (8.084 sec)
INFO:tensorflow:lr = 4.259124e-05 (8.080 sec)
INFO:tensorflow:global_step/sec: 11.0319
INFO:tensorflow:loss = 1.2413177, step = 222960 (9.068 sec)
INFO:tensorflow:lr = 4.254846e-05 (9.072 sec)
INFO:tensorflow:global_step/sec: 12.547
INFO:tensorflow:loss = 1.2451798, step = 223060 (7.968 sec)
INFO:tensorflow:lr = 4.250572e-05 (7.963 sec)
INFO:tensorflow:global_step/sec: 12.8653
INFO:tensorflow:loss = 1.2412239, step = 223160 (7.777 sec)
INFO:tensorflow:lr = 4.2463023e-05 (7.777 sec)
INFO:tensorflow:global_step/sec: 12.6293
INFO:tensorflow:loss = 1.2409556, step = 223260 (7.917 sec)
INFO:tensorflow:lr = 4.2420364e-05 (7.918 sec)
INFO:tensorflow:global_step/sec: 12.6865
INFO:tensorflow:loss = 1.241664, step = 223360 (7.880 sec)
INFO:tensorflow:lr = 4.237775e-05 (7.879 sec)
INFO:tensorflow:global_step/sec: 12.646
INFO:tensorflow:loss = 1.241841, step = 223460 (7.911 sec)
INFO:tensorflow:lr = 4.233519e-05 (7.911 sec)
INFO:tensorflow:global_step/sec: 12.4094
INFO:tensorflow:loss = 1.2418112, step = 223560 (8.059 sec)
INFO:tensorflow:lr = 4.229266e-05 (8.059 sec)
INFO:tensorflow:global_step/sec: 12.9008
INFO:tensorflow:loss = 1.2413185, step = 223660 (7.745 sec)
INFO:tensorflow:lr = 4.2250176e-05 (7.746 sec)
INFO:tensorflow:global_step/sec: 12.9506
INFO:tensorflow:loss = 1.2488402, step = 223760 (7.725 sec)
INFO:tensorflow:lr = 4.2207732e-05 (7.725 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.7749
INFO:tensorflow:loss = 1.2431126, step = 223860 (8.496 sec)
INFO:tensorflow:lr = 4.2165328e-05 (8.502 sec)
INFO:tensorflow:global_step/sec: 11.4856
INFO:tensorflow:loss = 1.2412598, step = 223960 (8.705 sec)
INFO:tensorflow:lr = 4.2122978e-05 (8.700 sec)
INFO:tensorflow:global_step/sec: 12.8892
INFO:tensorflow:loss = 1.2441949, step = 224060 (7.757 sec)
INFO:tensorflow:lr = 4.2080665e-05 (7.756 sec)
INFO:tensorflow:global_step/sec: 12.6143
INFO:tensorflow:loss = 1.2411182, step = 224160 (7.926 sec)
INFO:tensorflow:lr = 4.203839e-05 (7.929 sec)
INFO:tensorflow:global_step/sec: 12.9576
INFO:tensorflow:loss = 1.2425789, step = 224260 (7.719 sec)
INFO:tensorflow:lr = 4.1996165e-05 (7.716 sec)
INFO:tensorflow:global_step/sec: 12.6436
INFO:tensorflow:loss = 1.2407291, step = 224360 (7.910 sec)
INFO:tensorflow:lr = 4.1953976e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.9342
INFO:tensorflow:loss = 1.241793, step = 224460 (7.727 sec)
INFO:tensorflow:lr = 4.1911837e-05 (7.726 sec)
INFO:tensorflow:global_step/sec: 12.7712
INFO:tensorflow:loss = 1.2459935, step = 224560 (7.830 sec)
INFO:tensorflow:lr = 4.186973e-05 (7.838 sec)
INFO:tensorflow:global_step/sec: 12.5492
INFO:tensorflow:loss = 1.241738, step = 224660 (7.969 sec)
INFO:tensorflow:lr = 4.1827676e-05 (7.967 sec)
INFO:tensorflow:global_step/sec: 12.9812
INFO:tensorflow:loss = 1.2425698, step = 224760 (7.706 sec)
INFO:tensorflow:lr = 4.1785654e-05 (7.700 sec)
INFO:tensorflow:global_step/sec: 12.5881
INFO:tensorflow:loss = 1.2425317, step = 224860 (7.955 sec)
INFO:tensorflow:lr = 4.1743675e-05 (7.955 sec)
INFO:tensorflow:Saving checkpoints for 224940 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.24172.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-224940
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show playing ] [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                     in:get_event                                                                 
  ________________________|______________________________________________                          
 |     |    |             |                                         sl:location                   
 |     |    |             |                                              |                         
 |     |    |             |                                       in:get_location                 
 |     |    |             |                              ________________|_______________          
 |     |    |      sl:category_even              sl:search_radius                 sl:location_user
 |     |    |             t                             |                                |        
 |     |    |    _________|_________________            |                                |         
what times are the    nutcracker    show playing       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-224940
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv
INFO:tensorflow:Evaluation: Testing (Exact Match) Accuracy: 0.728
INFO:tensorflow:Best (Exact Match) Accuracy: 0.733
INFO:tensorflow:Calling model_fn.
/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:38: DeprecationWarning: elementwise comparison failed; this will raise an error in the future.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
[<tf.Variable 'Embedding/dense/kernel:0' shape=(1024, 300) dtype=float32_ref>,
 <tf.Variable 'Embedding/dense/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Embedding/glove:0' shape=(8692, 300) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/kernel:0' shape=(900, 1200) dtype=float32_ref>,
 <tf.Variable 'Encoder/lstm_fused_cell_1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/affine_bias:0' shape=(8692,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_0/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/self_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/kernel:0' shape=(300, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/query/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/key/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/kernel:0' shape=(600, 512) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/value/bias:0' shape=(512,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/kernel:0' shape=(512, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/encdec_attention/multihead_attention/output/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/past_poswise_ln/gamma:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/kernel:0' shape=(300, 1200) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv1/bias:0' shape=(1200,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/kernel:0' shape=(1200, 300) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/layer_1/ffn/conv2/bias:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/beta:0' shape=(300,) dtype=float32_ref>,
 <tf.Variable 'Decoder/transformer_decoder/gamma:0' shape=(300,) dtype=float32_ref>]
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Create CheckpointSaverHook.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-224940
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
INFO:tensorflow:Saving checkpoints for 224940 into ../model/lstm_transformer/model.ckpt.
Reading ../data/train.tsv
INFO:tensorflow:loss = 1.245515, step = 224940
INFO:tensorflow:lr = 4.171013e-05
INFO:tensorflow:global_step/sec: 10.21
INFO:tensorflow:loss = 1.2412355, step = 225040 (9.801 sec)
INFO:tensorflow:lr = 4.166823e-05 (9.802 sec)
INFO:tensorflow:global_step/sec: 12.5524
INFO:tensorflow:loss = 1.2411782, step = 225140 (7.966 sec)
INFO:tensorflow:lr = 4.1626372e-05 (7.966 sec)
INFO:tensorflow:global_step/sec: 12.9635
INFO:tensorflow:loss = 1.2436695, step = 225240 (7.714 sec)
INFO:tensorflow:lr = 4.158456e-05 (7.714 sec)
INFO:tensorflow:global_step/sec: 12.8617
INFO:tensorflow:loss = 1.2410346, step = 225340 (7.770 sec)
INFO:tensorflow:lr = 4.1542786e-05 (7.773 sec)
INFO:tensorflow:global_step/sec: 12.7585
INFO:tensorflow:loss = 1.2414058, step = 225440 (7.842 sec)
INFO:tensorflow:lr = 4.1501055e-05 (7.840 sec)
INFO:tensorflow:global_step/sec: 12.5799
INFO:tensorflow:loss = 1.2416364, step = 225540 (7.948 sec)
INFO:tensorflow:lr = 4.145937e-05 (7.948 sec)
INFO:tensorflow:global_step/sec: 12.6295
INFO:tensorflow:loss = 1.241216, step = 225640 (7.919 sec)
INFO:tensorflow:lr = 4.141772e-05 (7.919 sec)
INFO:tensorflow:global_step/sec: 12.63
INFO:tensorflow:loss = 1.2452391, step = 225740 (7.920 sec)
INFO:tensorflow:lr = 4.137612e-05 (7.920 sec)
INFO:tensorflow:global_step/sec: 12.7772
INFO:tensorflow:loss = 1.2397666, step = 225840 (7.825 sec)
INFO:tensorflow:lr = 4.133455e-05 (7.825 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.1808
INFO:tensorflow:loss = 1.240168, step = 225940 (12.223 sec)
INFO:tensorflow:lr = 4.1293028e-05 (12.223 sec)
INFO:tensorflow:global_step/sec: 12.7142
INFO:tensorflow:loss = 1.242873, step = 226040 (7.866 sec)
INFO:tensorflow:lr = 4.125155e-05 (7.865 sec)
INFO:tensorflow:global_step/sec: 12.8279
INFO:tensorflow:loss = 1.2412157, step = 226140 (7.794 sec)
INFO:tensorflow:lr = 4.1210107e-05 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.566
INFO:tensorflow:loss = 1.2413632, step = 226240 (7.955 sec)
INFO:tensorflow:lr = 4.1168714e-05 (7.954 sec)
INFO:tensorflow:global_step/sec: 12.7163
INFO:tensorflow:loss = 1.2435849, step = 226340 (7.866 sec)
INFO:tensorflow:lr = 4.112736e-05 (7.867 sec)
INFO:tensorflow:global_step/sec: 12.8243
INFO:tensorflow:loss = 1.2454369, step = 226440 (7.796 sec)
INFO:tensorflow:lr = 4.108604e-05 (7.795 sec)
INFO:tensorflow:global_step/sec: 12.6798
INFO:tensorflow:loss = 1.245144, step = 226540 (7.887 sec)
INFO:tensorflow:lr = 4.1044772e-05 (7.886 sec)
INFO:tensorflow:global_step/sec: 12.7597
INFO:tensorflow:loss = 1.2447907, step = 226640 (7.837 sec)
INFO:tensorflow:lr = 4.100354e-05 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.6933
INFO:tensorflow:loss = 1.2408261, step = 226740 (7.882 sec)
INFO:tensorflow:lr = 4.0962354e-05 (7.883 sec)
INFO:tensorflow:global_step/sec: 12.4884
INFO:tensorflow:loss = 1.240148, step = 226840 (8.009 sec)
INFO:tensorflow:lr = 4.09212e-05 (8.008 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.39542
INFO:tensorflow:loss = 1.2397572, step = 226940 (11.906 sec)
INFO:tensorflow:lr = 4.0880095e-05 (11.906 sec)
INFO:tensorflow:global_step/sec: 12.7057
INFO:tensorflow:loss = 1.2418107, step = 227040 (7.877 sec)
INFO:tensorflow:lr = 4.0839033e-05 (7.877 sec)
INFO:tensorflow:global_step/sec: 12.6331
INFO:tensorflow:loss = 1.2409166, step = 227140 (7.910 sec)
INFO:tensorflow:lr = 4.0798008e-05 (7.910 sec)
INFO:tensorflow:global_step/sec: 12.865
INFO:tensorflow:loss = 1.2418015, step = 227240 (7.772 sec)
INFO:tensorflow:lr = 4.075703e-05 (7.772 sec)
INFO:tensorflow:global_step/sec: 12.8334
INFO:tensorflow:loss = 1.2457359, step = 227340 (7.797 sec)
INFO:tensorflow:lr = 4.0716084e-05 (7.797 sec)
INFO:tensorflow:global_step/sec: 12.8722
INFO:tensorflow:loss = 1.2415484, step = 227440 (7.768 sec)
INFO:tensorflow:lr = 4.067518e-05 (7.768 sec)
INFO:tensorflow:global_step/sec: 12.6562
INFO:tensorflow:loss = 1.2438579, step = 227540 (7.902 sec)
INFO:tensorflow:lr = 4.0634328e-05 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.728
INFO:tensorflow:loss = 1.2444311, step = 227640 (7.854 sec)
INFO:tensorflow:lr = 4.0593506e-05 (7.858 sec)
INFO:tensorflow:global_step/sec: 12.7264
INFO:tensorflow:loss = 1.2432747, step = 227740 (7.860 sec)
INFO:tensorflow:lr = 4.055273e-05 (7.855 sec)
INFO:tensorflow:global_step/sec: 12.9611
INFO:tensorflow:loss = 1.2415364, step = 227840 (7.717 sec)
INFO:tensorflow:lr = 4.0511994e-05 (7.718 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.30722
INFO:tensorflow:loss = 1.2399315, step = 227940 (12.039 sec)
INFO:tensorflow:lr = 4.0471296e-05 (12.038 sec)
INFO:tensorflow:global_step/sec: 12.6838
INFO:tensorflow:loss = 1.2412345, step = 228040 (7.878 sec)
INFO:tensorflow:lr = 4.0430645e-05 (7.878 sec)
INFO:tensorflow:global_step/sec: 12.9424
INFO:tensorflow:loss = 1.2414714, step = 228140 (7.732 sec)
INFO:tensorflow:lr = 4.039003e-05 (7.732 sec)
INFO:tensorflow:global_step/sec: 13.0548
INFO:tensorflow:loss = 1.2409471, step = 228240 (7.660 sec)
INFO:tensorflow:lr = 4.034946e-05 (7.659 sec)
INFO:tensorflow:global_step/sec: 12.6404
INFO:tensorflow:loss = 1.2413936, step = 228340 (7.906 sec)
INFO:tensorflow:lr = 4.0308925e-05 (7.907 sec)
INFO:tensorflow:global_step/sec: 12.6828
INFO:tensorflow:loss = 1.2451051, step = 228440 (7.886 sec)
INFO:tensorflow:lr = 4.026843e-05 (7.887 sec)
INFO:tensorflow:global_step/sec: 12.8877
INFO:tensorflow:loss = 1.2420641, step = 228540 (7.759 sec)
INFO:tensorflow:lr = 4.0227984e-05 (7.757 sec)
INFO:tensorflow:global_step/sec: 12.6603
INFO:tensorflow:loss = 1.2408705, step = 228640 (7.901 sec)
INFO:tensorflow:lr = 4.0187577e-05 (7.902 sec)
INFO:tensorflow:global_step/sec: 12.9905
INFO:tensorflow:loss = 1.2428869, step = 228740 (7.700 sec)
INFO:tensorflow:lr = 4.014721e-05 (7.699 sec)
INFO:tensorflow:global_step/sec: 12.8204
INFO:tensorflow:loss = 1.2405547, step = 228840 (7.800 sec)
INFO:tensorflow:lr = 4.0106876e-05 (7.803 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.38389
INFO:tensorflow:loss = 1.2480453, step = 228940 (11.929 sec)
INFO:tensorflow:lr = 4.0066585e-05 (11.926 sec)
INFO:tensorflow:global_step/sec: 12.8982
INFO:tensorflow:loss = 1.242588, step = 229040 (7.752 sec)
INFO:tensorflow:lr = 4.0026338e-05 (7.752 sec)
INFO:tensorflow:global_step/sec: 12.7452
INFO:tensorflow:loss = 1.2459991, step = 229140 (7.848 sec)
INFO:tensorflow:lr = 3.9986127e-05 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.8336
INFO:tensorflow:loss = 1.2415149, step = 229240 (7.788 sec)
INFO:tensorflow:lr = 3.994596e-05 (7.788 sec)
INFO:tensorflow:global_step/sec: 12.2859
INFO:tensorflow:loss = 1.242039, step = 229340 (8.141 sec)
INFO:tensorflow:lr = 3.9905834e-05 (8.142 sec)
INFO:tensorflow:global_step/sec: 12.5119
INFO:tensorflow:loss = 1.25192, step = 229440 (7.995 sec)
INFO:tensorflow:lr = 3.986575e-05 (7.993 sec)
INFO:tensorflow:global_step/sec: 12.7531
INFO:tensorflow:loss = 1.245667, step = 229540 (7.844 sec)
INFO:tensorflow:lr = 3.9825703e-05 (7.844 sec)
INFO:tensorflow:global_step/sec: 12.8561
INFO:tensorflow:loss = 1.2407379, step = 229640 (7.773 sec)
INFO:tensorflow:lr = 3.9785693e-05 (7.772 sec)
INFO:tensorflow:global_step/sec: 12.7172
INFO:tensorflow:loss = 1.2451239, step = 229740 (7.867 sec)
INFO:tensorflow:lr = 3.9745733e-05 (7.867 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 8.73178
INFO:tensorflow:loss = 1.2411838, step = 229840 (11.447 sec)
INFO:tensorflow:lr = 3.9705807e-05 (11.449 sec)
INFO:tensorflow:global_step/sec: 12.9561
INFO:tensorflow:loss = 1.2413689, step = 229940 (7.720 sec)
INFO:tensorflow:lr = 3.9665916e-05 (7.724 sec)
INFO:tensorflow:global_step/sec: 12.7091
INFO:tensorflow:loss = 1.2430978, step = 230040 (7.869 sec)
INFO:tensorflow:lr = 3.9626073e-05 (7.863 sec)
INFO:tensorflow:global_step/sec: 12.7369
INFO:tensorflow:loss = 1.242768, step = 230140 (7.851 sec)
INFO:tensorflow:lr = 3.958627e-05 (7.852 sec)
INFO:tensorflow:global_step/sec: 12.7465
INFO:tensorflow:loss = 1.2418132, step = 230240 (7.848 sec)
INFO:tensorflow:lr = 3.9546507e-05 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.9642
INFO:tensorflow:loss = 1.2418685, step = 230340 (7.710 sec)
INFO:tensorflow:lr = 3.950678e-05 (7.709 sec)
INFO:tensorflow:global_step/sec: 12.4698
INFO:tensorflow:loss = 1.2514341, step = 230440 (8.018 sec)
INFO:tensorflow:lr = 3.946709e-05 (8.019 sec)
INFO:tensorflow:global_step/sec: 12.4999
INFO:tensorflow:loss = 1.2429241, step = 230540 (8.008 sec)
INFO:tensorflow:lr = 3.942745e-05 (8.010 sec)
INFO:tensorflow:global_step/sec: 12.7492
INFO:tensorflow:loss = 1.2442654, step = 230640 (7.841 sec)
INFO:tensorflow:lr = 3.938784e-05 (7.839 sec)
INFO:tensorflow:global_step/sec: 12.6677
INFO:tensorflow:loss = 1.2414587, step = 230740 (7.889 sec)
INFO:tensorflow:lr = 3.9348277e-05 (7.890 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 9.14225
INFO:tensorflow:loss = 1.2435497, step = 230840 (10.951 sec)
INFO:tensorflow:lr = 3.9308747e-05 (10.950 sec)
INFO:tensorflow:global_step/sec: 12.8207
INFO:tensorflow:loss = 1.2424185, step = 230940 (7.791 sec)
INFO:tensorflow:lr = 3.926926e-05 (7.791 sec)
INFO:tensorflow:global_step/sec: 12.5554
INFO:tensorflow:loss = 1.2412125, step = 231040 (7.966 sec)
INFO:tensorflow:lr = 3.9229813e-05 (7.966 sec)
INFO:tensorflow:global_step/sec: 12.9233
INFO:tensorflow:loss = 1.2414656, step = 231140 (7.733 sec)
INFO:tensorflow:lr = 3.9190403e-05 (7.734 sec)
INFO:tensorflow:global_step/sec: 12.6232
INFO:tensorflow:loss = 1.2446767, step = 231240 (7.922 sec)
INFO:tensorflow:lr = 3.915104e-05 (7.926 sec)
INFO:tensorflow:global_step/sec: 12.8202
INFO:tensorflow:loss = 1.2399716, step = 231340 (7.804 sec)
INFO:tensorflow:lr = 3.911171e-05 (7.800 sec)
INFO:tensorflow:global_step/sec: 12.6593
INFO:tensorflow:loss = 1.2404665, step = 231440 (7.896 sec)
INFO:tensorflow:lr = 3.9072416e-05 (7.899 sec)
INFO:tensorflow:global_step/sec: 12.8141
INFO:tensorflow:loss = 1.2436392, step = 231540 (7.805 sec)
INFO:tensorflow:lr = 3.9033173e-05 (7.804 sec)
INFO:tensorflow:global_step/sec: 12.6215
INFO:tensorflow:loss = 1.2410214, step = 231640 (7.928 sec)
INFO:tensorflow:lr = 3.899396e-05 (7.925 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.0998
INFO:tensorflow:loss = 1.2402171, step = 231740 (8.273 sec)
INFO:tensorflow:lr = 3.8954797e-05 (8.274 sec)
INFO:tensorflow:global_step/sec: 10.8586
INFO:tensorflow:loss = 1.2410094, step = 231840 (9.195 sec)
INFO:tensorflow:lr = 3.8915663e-05 (9.195 sec)
INFO:tensorflow:global_step/sec: 12.9364
INFO:tensorflow:loss = 1.2405255, step = 231940 (7.729 sec)
INFO:tensorflow:lr = 3.887657e-05 (7.735 sec)
INFO:tensorflow:global_step/sec: 12.591
INFO:tensorflow:loss = 1.2420667, step = 232040 (7.948 sec)
INFO:tensorflow:lr = 3.883752e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.6597
INFO:tensorflow:loss = 1.2402742, step = 232140 (7.898 sec)
INFO:tensorflow:lr = 3.8798502e-05 (7.898 sec)
INFO:tensorflow:global_step/sec: 12.7635
INFO:tensorflow:loss = 1.2407392, step = 232240 (7.837 sec)
INFO:tensorflow:lr = 3.875953e-05 (7.837 sec)
INFO:tensorflow:global_step/sec: 12.7974
INFO:tensorflow:loss = 1.2414687, step = 232340 (7.813 sec)
INFO:tensorflow:lr = 3.872059e-05 (7.813 sec)
INFO:tensorflow:global_step/sec: 12.7841
INFO:tensorflow:loss = 1.2432356, step = 232440 (7.823 sec)
INFO:tensorflow:lr = 3.8681694e-05 (7.824 sec)
INFO:tensorflow:global_step/sec: 12.6057
INFO:tensorflow:loss = 1.241169, step = 232540 (7.931 sec)
INFO:tensorflow:lr = 3.8642844e-05 (7.931 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 12.7646
INFO:tensorflow:loss = 1.2469207, step = 232640 (7.833 sec)
INFO:tensorflow:lr = 3.860402e-05 (7.833 sec)
INFO:tensorflow:global_step/sec: 10.9391
INFO:tensorflow:loss = 1.2405813, step = 232740 (9.139 sec)
INFO:tensorflow:lr = 3.8565246e-05 (9.139 sec)
INFO:tensorflow:global_step/sec: 12.9065
INFO:tensorflow:loss = 1.2419277, step = 232840 (7.753 sec)
INFO:tensorflow:lr = 3.8526505e-05 (7.753 sec)
INFO:tensorflow:global_step/sec: 12.7425
INFO:tensorflow:loss = 1.241205, step = 232940 (7.847 sec)
INFO:tensorflow:lr = 3.84878e-05 (7.848 sec)
INFO:tensorflow:global_step/sec: 12.6472
INFO:tensorflow:loss = 1.241587, step = 233040 (7.906 sec)
INFO:tensorflow:lr = 3.8449143e-05 (7.906 sec)
INFO:tensorflow:global_step/sec: 12.274
INFO:tensorflow:loss = 1.2420787, step = 233140 (8.144 sec)
INFO:tensorflow:lr = 3.8410515e-05 (8.142 sec)
INFO:tensorflow:global_step/sec: 12.1353
INFO:tensorflow:loss = 1.2417104, step = 233240 (8.247 sec)
INFO:tensorflow:lr = 3.8371934e-05 (8.248 sec)
INFO:tensorflow:global_step/sec: 12.1941
INFO:tensorflow:loss = 1.2428356, step = 233340 (8.194 sec)
INFO:tensorflow:lr = 3.833339e-05 (8.194 sec)
INFO:tensorflow:global_step/sec: 12.1589
INFO:tensorflow:loss = 1.2426999, step = 233440 (8.227 sec)
INFO:tensorflow:lr = 3.8294882e-05 (8.228 sec)
INFO:tensorflow:global_step/sec: 11.8032
INFO:tensorflow:loss = 1.240998, step = 233540 (8.472 sec)
INFO:tensorflow:lr = 3.8256414e-05 (8.473 sec)
Reading ../data/train.tsv
INFO:tensorflow:global_step/sec: 11.5196
INFO:tensorflow:loss = 1.2467922, step = 233640 (8.685 sec)
INFO:tensorflow:lr = 3.8217982e-05 (8.685 sec)
INFO:tensorflow:global_step/sec: 11.2044
INFO:tensorflow:loss = 1.239357, step = 233740 (8.920 sec)
INFO:tensorflow:lr = 3.8179598e-05 (8.917 sec)
INFO:tensorflow:global_step/sec: 12.3381
INFO:tensorflow:loss = 1.240096, step = 233840 (8.109 sec)
INFO:tensorflow:lr = 3.814124e-05 (8.109 sec)
INFO:tensorflow:global_step/sec: 12.2644
INFO:tensorflow:loss = 1.2404408, step = 233940 (8.156 sec)
INFO:tensorflow:lr = 3.8102924e-05 (8.155 sec)
INFO:tensorflow:global_step/sec: 12.5479
INFO:tensorflow:loss = 1.2412769, step = 234040 (7.964 sec)
INFO:tensorflow:lr = 3.8064652e-05 (7.965 sec)
INFO:tensorflow:global_step/sec: 12.4405
INFO:tensorflow:loss = 1.2444044, step = 234140 (8.037 sec)
INFO:tensorflow:lr = 3.8026414e-05 (8.040 sec)
INFO:tensorflow:global_step/sec: 12.5963
INFO:tensorflow:loss = 1.2408541, step = 234240 (7.939 sec)
INFO:tensorflow:lr = 3.798822e-05 (7.935 sec)
INFO:tensorflow:global_step/sec: 12.8113
INFO:tensorflow:loss = 1.2447264, step = 234340 (7.813 sec)
INFO:tensorflow:lr = 3.7950056e-05 (7.813 sec)
INFO:tensorflow:global_step/sec: 12.5906
INFO:tensorflow:loss = 1.2432296, step = 234440 (7.941 sec)
INFO:tensorflow:lr = 3.791193e-05 (7.942 sec)
INFO:tensorflow:global_step/sec: 12.2831
INFO:tensorflow:loss = 1.2440478, step = 234540 (8.141 sec)
INFO:tensorflow:lr = 3.787385e-05 (8.140 sec)
INFO:tensorflow:global_step/sec: 12.4469
INFO:tensorflow:loss = 1.2417731, step = 234640 (8.028 sec)
INFO:tensorflow:lr = 3.78358e-05 (8.029 sec)
INFO:tensorflow:Saving checkpoints for 234720 into ../model/lstm_transformer/model.ckpt.
INFO:tensorflow:Loss for final step: 1.2419497.
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-234720
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
------------
minimal test
utterance: what times are the nutcracker show playing near me
parsed: [ in:get_event what times are [ sl:category_event the nutcracker show ] playing [ sl:location [ in:get_location [ sl:search_radius near ] [ sl:location_user me ] ] ] ]

                       in:get_event                                                                        
  __________________________|_____________________________________________________                          
 |     |    |     |                        |                                 sl:location                   
 |     |    |     |                        |                                      |                         
 |     |    |     |                        |                               in:get_location                 
 |     |    |     |                        |                      ________________|_______________          
 |     |    |     |                 sl:category_even      sl:search_radius                 sl:location_user
 |     |    |     |                        t                     |                                |        
 |     |    |     |          ______________|__________           |                                |         
what times are playing     the         nutcracker    show       near                              me       

------------
Reading ../data/test.tsv
INFO:tensorflow:Calling model_fn.
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Saver not created because there are no variables in the graph to restore
INFO:tensorflow:Done calling model_fn.
INFO:tensorflow:Graph was finalized.
INFO:tensorflow:Restoring parameters from ../model/lstm_transformer/model.ckpt-234720
INFO:tensorflow:Running local_init_op.
INFO:tensorflow:Done running local_init_op.
Reading ../data/test.tsv