In [1]:
# Colab-only setup: mount Google Drive, then make the project's `main` folder
# the working directory so the relative '../data/...' paths in `params` resolve.
from google.colab import drive
drive.mount('/content/gdrive')
import os
# Must run after the mount above: the target directory lives on the mounted drive.
os.chdir('/content/gdrive/My Drive/finch/tensorflow2/text_classification/imdb/main')
Drive already mounted at /content/gdrive; to attempt to forcibly remount, call drive.mount("/content/gdrive", force_remount=True).
In [2]:
%tensorflow_version 2.x
!pip install tensorflow-addons
!pip install transformers
Requirement already satisfied: tensorflow-addons in /usr/local/lib/python3.6/dist-packages (0.8.3)
Requirement already satisfied: typeguard in /usr/local/lib/python3.6/dist-packages (from tensorflow-addons) (2.7.1)
Requirement already satisfied: transformers in /usr/local/lib/python3.6/dist-packages (3.0.2)
Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.6/dist-packages (from transformers) (4.41.1)
Requirement already satisfied: filelock in /usr/local/lib/python3.6/dist-packages (from transformers) (3.0.12)
Requirement already satisfied: requests in /usr/local/lib/python3.6/dist-packages (from transformers) (2.23.0)
Requirement already satisfied: tokenizers==0.8.1.rc1 in /usr/local/lib/python3.6/dist-packages (from transformers) (0.8.1rc1)
Requirement already satisfied: sacremoses in /usr/local/lib/python3.6/dist-packages (from transformers) (0.0.43)
Requirement already satisfied: sentencepiece!=0.1.92 in /usr/local/lib/python3.6/dist-packages (from transformers) (0.1.91)
Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.6/dist-packages (from transformers) (2019.12.20)
Requirement already satisfied: dataclasses; python_version < "3.7" in /usr/local/lib/python3.6/dist-packages (from transformers) (0.7)
Requirement already satisfied: packaging in /usr/local/lib/python3.6/dist-packages (from transformers) (20.4)
Requirement already satisfied: numpy in /usr/local/lib/python3.6/dist-packages (from transformers) (1.18.5)
Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.6/dist-packages (from requests->transformers) (2020.6.20)
Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.6/dist-packages (from requests->transformers) (3.0.4)
Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.6/dist-packages (from requests->transformers) (2.10)
Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.6/dist-packages (from requests->transformers) (1.24.3)
Requirement already satisfied: click in /usr/local/lib/python3.6/dist-packages (from sacremoses->transformers) (7.1.2)
Requirement already satisfied: six in /usr/local/lib/python3.6/dist-packages (from sacremoses->transformers) (1.12.0)
Requirement already satisfied: joblib in /usr/local/lib/python3.6/dist-packages (from sacremoses->transformers) (0.16.0)
Requirement already satisfied: pyparsing>=2.0.2 in /usr/local/lib/python3.6/dist-packages (from packaging->transformers) (2.4.7)
In [3]:
from transformers import RobertaTokenizer, TFRobertaModel

import tensorflow as tf
import tensorflow_addons as tfa
import numpy as np
import pprint
import logging
import time

# Report the runtime so the recorded results can be tied to a TF version.
print("TensorFlow Version", tf.__version__)
# `tf.test.is_gpu_available()` is deprecated; listing the physical GPU devices
# is the replacement TensorFlow itself recommends. A non-empty list means a GPU
# is visible to this runtime.
print('GPU Enabled:', bool(tf.config.list_physical_devices('GPU')))
TensorFlow Version 2.2.0
WARNING:tensorflow:From <ipython-input-3-1e763de9ead9>:11: is_gpu_available (from tensorflow.python.framework.test_util) is deprecated and will be removed in a future version.
Instructions for updating:
Use `tf.config.list_physical_devices('GPU')` instead.
GPU Enabled: True
In [4]:
# Single configuration dictionary read by the data pipeline, the model and the
# training loop. Paths are relative to the working directory set earlier.
params = dict(
  # Tab-separated "label<TAB>text" files consumed by data_generator().
  train_paths = [
    '../data/train_bt_part1.txt',
    '../data/train_bt_part2.txt',
    '../data/train_bt_part3.txt',
    '../data/train_bt_part4.txt',
    '../data/train_bt_part5.txt',
    '../data/train_bt_part6.txt',
  ],
  test_paths = [
    '../data/test.txt',
  ],
  # Name handed to `from_pretrained` for both the tokenizer and the encoder.
  pretrain_path = 'roberta-base',
  # Used as the shuffle buffer size and to derive the LR schedule step size.
  num_samples = 2 * 25000,
  batch_size = 8,
  # Token sequences longer than this are cut to their head and tail halves.
  max_len = 300,
  # Number of consecutive non-improving evaluations tolerated before stopping.
  num_patience = 5,
  # Lower and upper bounds of the cyclical learning-rate schedule.
  init_lr = 1e-5,
  max_lr = 3e-5,
)
In [5]:
# Load the tokenizer matching the pretrained checkpoint named in
# params['pretrain_path']. It is a notebook-level global: data_generator()
# reads it directly rather than receiving it as an argument.
# NOTE(review): `lowercase` and `add_special_tokens` do not look like
# RobertaTokenizer constructor options (special tokens are added by hand in
# data_generator()) — confirm whether these keyword arguments have any effect.
tokenizer = RobertaTokenizer.from_pretrained(params['pretrain_path'],
                                             lowercase = True,
                                             add_special_tokens = True)
In [6]:
def data_generator(f_paths, params):
  """Yield one (token_ids, label) example per non-empty line of each file.

  Every line is expected to be ``label<TAB>text``. The text is tokenized with
  the notebook-level ``tokenizer``, wrapped in ``<s>`` / ``</s>``, and, when
  the wrapped sequence is longer than ``params['max_len']``, shortened to its
  first and last ``max_len // 2`` tokens so both the opening and the ending of
  the text survive.

  Args:
    f_paths: iterable of file paths, read in order.
    params: configuration dict; only ``'max_len'`` is read here.

  Yields:
    (list of int token ids, int label)

  Raises:
    ValueError: if a non-empty line has no tab separator or the label is not
      an integer.
  """
  # Loop-invariant: how many tokens to keep from each end when truncating.
  half_len = params['max_len'] // 2
  for f_path in f_paths:
    # Explicit encoding so the result does not depend on the platform default.
    with open(f_path, encoding='utf-8') as f:
      print('Reading', f_path)
      for line in f:
        line = line.rstrip()
        if not line:
          # Tolerate blank lines (e.g. a trailing newline at end of file).
          continue
        # Split on the first tab only: the text itself may contain tabs.
        label, text = line.split('\t', 1)
        tokens = ['<s>'] + tokenizer.tokenize(text) + ['</s>']
        if len(tokens) > params['max_len']:
          tokens = tokens[:half_len] + tokens[-half_len:]
        yield tokenizer.convert_tokens_to_ids(tokens), int(label)


def dataset(is_training, params):
  """Build the batched tf.data pipeline for training or evaluation.

  Examples come from data_generator() over ``params['train_paths']`` when
  ``is_training`` is truthy, otherwise over ``params['test_paths']``. Training
  data is additionally shuffled with a buffer of ``params['num_samples']``
  elements. In both modes the examples are padded-batched to
  ``params['batch_size']`` and prefetched.

  Args:
    is_training: selects the training (shuffled) or test pipeline.
    params: configuration dict.

  Returns:
    A tf.data.Dataset of (token_ids, labels) batches; token ids are int32 with
    a variable-length second axis padded with 1, labels are int32 scalars per
    example.
  """
  element_shapes = ([None], ())
  element_types = (tf.int32, tf.int32)
  # Padding values per component; the label component is scalar, so only the
  # first value (1) actually ends up in the batches.
  pad_values = (1, -1)

  paths_key = 'train_paths' if is_training else 'test_paths'
  pipeline = tf.data.Dataset.from_generator(
    lambda: data_generator(params[paths_key], params),
    output_types = element_types,
    output_shapes = element_shapes,)

  if is_training:
    pipeline = pipeline.shuffle(params['num_samples'])

  pipeline = pipeline.padded_batch(
    params['batch_size'], element_shapes, pad_values)
  return pipeline.prefetch(tf.data.experimental.AUTOTUNE)
In [7]:
# input stream ids check
# Pull the first (token_ids, label) pair from the training generator and print
# the ids; the sequence should begin with the id of '<s>' and end with the id
# of '</s>', since data_generator() wraps every example in those tokens.
# NOTE: this binds the notebook-level name `text`, which the training loop
# later rebinds to a batch tensor.
text, _ = next(data_generator(params['train_paths'], params))
print(text)
Reading ../data/train_bt_part1.txt
[0, 118, 1979, 75, 5956, 42, 65, 190, 15, 1404, 7582, 363, 2]
In [8]:
class RobertaFinetune(tf.keras.Model):
  """Pretrained RoBERTa encoder with a two-layer classification head.

  The head is dropout -> Dense(300, swish) -> dropout -> Dense(2) and produces
  unnormalised logits for two classes.
  """

  def __init__(self, params):
    """Create the encoder and head layers.

    Args:
      params: configuration dict; ``params['pretrain_path']`` names the
        checkpoint passed to ``TFRobertaModel.from_pretrained``.
    """
    super().__init__()
    # The encoder is loaded as trainable so it is fine-tuned with the head.
    self.bert = TFRobertaModel.from_pretrained(
      params['pretrain_path'], trainable=True)
    self.drop_1 = tf.keras.layers.Dropout(rate=.1)
    self.fc = tf.keras.layers.Dense(
      units=300, activation=tf.nn.swish, name='down_stream/fc')
    self.drop_2 = tf.keras.layers.Dropout(rate=.1)
    self.out = tf.keras.layers.Dense(units=2, name='down_stream/out')

  def call(self, bert_inputs, training):
    """Run the encoder and the classification head.

    Args:
      bert_inputs: sequence of tensors forwarded to the encoder as a list
        (the training loop passes ``[token_ids, attention_mask]``); every
        tensor is cast to int32 first.
      training: forwarded to the encoder and to both dropout layers.

    Returns:
      Logits tensor whose last dimension is 2.
    """
    int_inputs = [tf.cast(tensor, tf.int32) for tensor in bert_inputs]
    encoder_outputs = self.bert(int_inputs, training=training)
    # Second element of the encoder output — presumably the pooled sequence
    # representation; confirm against the installed transformers version.
    pooled = encoder_outputs[1]
    hidden = self.fc(self.drop_1(pooled, training=training))
    return self.out(self.drop_2(hidden, training=training))
In [ ]:
# Instantiate the model and create its variables up front so they can be listed.
# build() is given three inputs of shape (batch, length), both unknown; note that
# the loops below call the model with only two tensors ([text, masks]).
model = RobertaFinetune(params)
model.build([[None, None], [None, None], [None, None]])
pprint.pprint([(v.name, v.shape) for v in model.trainable_variables])

# Cyclical learning rate between init_lr and max_lr. With the current params
# step_size is 2 * 50000 // 8 = 12500 optimizer steps.
step_size = 2 * params['num_samples'] // params['batch_size']
decay_lr = tfa.optimizers.Triangular2CyclicalLearningRate(
  initial_learning_rate = params['init_lr'],
  maximal_learning_rate = params['max_lr'],
  step_size = step_size,)
# Adam starts at init_lr; its learning rate is overwritten by hand on every
# step inside the loop (the schedule object is not passed to the optimizer).
optim = tf.optimizers.Adam(params['init_lr'])
global_step = 0

# Early-stopping state: best test accuracy so far and the number of
# consecutive evaluations that failed to beat it.
best_acc = .0
count = 0

t0 = time.time()
logger = logging.getLogger('tensorflow')
logger.setLevel(logging.INFO)

# Each iteration of this loop is one full pass over the training files followed
# by one full pass over the test files; it only exits via the patience check.
while True:
  # TRAINING
  for (text, labels) in dataset(is_training=True, params=params):
    with tf.GradientTape() as tape:
      # 1 is the value dataset() pads token ids with, so the mask is 1 on real
      # tokens and 0 on padding.
      masks = tf.cast(tf.math.not_equal(text, 1), tf.int32)
      logits = model([text, masks], training=True)
      # Two-class softmax cross-entropy on one-hot labels with label smoothing.
      loss = tf.compat.v1.losses.softmax_cross_entropy(
        tf.one_hot(labels, 2, dtype=tf.float32),
        logits = logits,
        label_smoothing = .2,)
      
    # Set this step's learning rate from the schedule before applying gradients.
    optim.lr.assign(decay_lr(global_step))
    grads = tape.gradient(loss, model.trainable_variables)
    # Clip the global gradient norm to 5 before the update.
    grads, _ = tf.clip_by_global_norm(grads, 5.)
    optim.apply_gradients(zip(grads, model.trainable_variables))
    
    # Log every 100 steps. "Spent" is the wall time since the previous log line
    # (t0 is only reset here, so it also includes any evaluation pass that ran
    # in between).
    if global_step % 100 == 0:
      logger.info("Step {} | Loss: {:.4f} | Spent: {:.1f} secs | LR: {:.6f}".format(
          global_step, loss.numpy().item(), time.time()-t0, optim.lr.numpy().item()))
      t0 = time.time()
    global_step += 1
  
  # EVALUATION
  # A fresh metric per pass, so accuracy covers only this evaluation.
  m = tf.keras.metrics.Accuracy()

  for (text, labels) in dataset(is_training=False, params=params):
    masks = tf.cast(tf.math.not_equal(text, 1), tf.int32)
    logits = model([text, masks], training=False)
    m.update_state(y_true=labels, y_pred=tf.argmax(logits, -1))

  acc = m.result().numpy()
  logger.info("Evaluation: Testing Accuracy: {:.3f}".format(acc))

  # Early stopping on test accuracy: reset the counter on a strict improvement,
  # otherwise count one more non-improving evaluation.
  if acc > best_acc:
    best_acc = acc
    # you can save model here
    count = 0
  else:
    count += 1
  logger.info("Best Accuracy: {:.3f}".format(best_acc))

  # Stop after num_patience consecutive evaluations without improvement.
  if count == params['num_patience']:
    print(params['num_patience'], "times not improve the best result, therefore stop training")
    break
Some weights of the model checkpoint at roberta-base were not used when initializing TFRobertaModel: ['lm_head']
- This IS expected if you are initializing TFRobertaModel from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPretraining model).
- This IS NOT expected if you are initializing TFRobertaModel from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
All the weights of TFRobertaModel were initialized from the model checkpoint at roberta-base.
If your task is similar to the task the model of the ckeckpoint was trained on, you can already use TFRobertaModel for predictions without further training.
[('tf_roberta_model/roberta/encoder/layer_._0/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._0/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._0/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._0/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._1/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._1/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._1/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._2/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._2/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._2/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._3/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._3/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._3/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._4/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._4/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._4/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._5/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._5/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._5/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._6/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._6/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._6/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._7/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._7/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._7/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._8/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._8/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._8/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._9/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._9/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._9/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._10/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._10/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._10/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/query/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/query/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/key/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/key/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/value/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/self/value/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/output/dense/kernel:0',
  TensorShape([768, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/attention/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/intermediate/dense/kernel:0',
  TensorShape([768, 3072])),
 ('tf_roberta_model/roberta/encoder/layer_._11/intermediate/dense/bias:0',
  TensorShape([3072])),
 ('tf_roberta_model/roberta/encoder/layer_._11/output/dense/kernel:0',
  TensorShape([3072, 768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/output/dense/bias:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/output/LayerNorm/gamma:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/encoder/layer_._11/output/LayerNorm/beta:0',
  TensorShape([768])),
 ('tf_roberta_model/roberta/pooler/dense/kernel:0', TensorShape([768, 768])),
 ('tf_roberta_model/roberta/pooler/dense/bias:0', TensorShape([768])),
 ('tf_roberta_model/roberta/embeddings/word_embeddings/weight:0',
  TensorShape([50265, 768])),
 ('tf_roberta_model/roberta/embeddings/position_embeddings/embeddings:0',
  TensorShape([514, 768])),
 ('tf_roberta_model/roberta/embeddings/token_type_embeddings/embeddings:0',
  TensorShape([1, 768])),
 ('tf_roberta_model/roberta/embeddings/LayerNorm/gamma:0', TensorShape([768])),
 ('tf_roberta_model/roberta/embeddings/LayerNorm/beta:0', TensorShape([768])),
 ('down_stream/fc/kernel:0', TensorShape([768, 300])),
 ('down_stream/fc/bias:0', TensorShape([300])),
 ('down_stream/out/kernel:0', TensorShape([300, 2])),
 ('down_stream/out/bias:0', TensorShape([2]))]
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 0 | Loss: 0.6991 | Spent: 57.9 secs | LR: 0.000010
INFO:tensorflow:Step 100 | Loss: 0.4685 | Spent: 44.7 secs | LR: 0.000010
INFO:tensorflow:Step 200 | Loss: 0.3321 | Spent: 44.8 secs | LR: 0.000010
INFO:tensorflow:Step 300 | Loss: 0.6533 | Spent: 44.4 secs | LR: 0.000010
INFO:tensorflow:Step 400 | Loss: 0.8705 | Spent: 44.7 secs | LR: 0.000011
INFO:tensorflow:Step 500 | Loss: 0.3697 | Spent: 45.1 secs | LR: 0.000011
INFO:tensorflow:Step 600 | Loss: 0.3400 | Spent: 44.8 secs | LR: 0.000011
INFO:tensorflow:Step 700 | Loss: 0.4978 | Spent: 44.9 secs | LR: 0.000011
INFO:tensorflow:Step 800 | Loss: 0.5003 | Spent: 44.7 secs | LR: 0.000011
INFO:tensorflow:Step 900 | Loss: 0.3352 | Spent: 44.5 secs | LR: 0.000011
INFO:tensorflow:Step 1000 | Loss: 0.5844 | Spent: 44.5 secs | LR: 0.000012
INFO:tensorflow:Step 1100 | Loss: 0.5365 | Spent: 44.7 secs | LR: 0.000012
INFO:tensorflow:Step 1200 | Loss: 0.5454 | Spent: 44.9 secs | LR: 0.000012
INFO:tensorflow:Step 1300 | Loss: 0.3843 | Spent: 44.5 secs | LR: 0.000012
INFO:tensorflow:Step 1400 | Loss: 0.3274 | Spent: 45.0 secs | LR: 0.000012
INFO:tensorflow:Step 1500 | Loss: 0.5204 | Spent: 44.7 secs | LR: 0.000012
INFO:tensorflow:Step 1600 | Loss: 0.3326 | Spent: 44.4 secs | LR: 0.000013
INFO:tensorflow:Step 1700 | Loss: 0.3396 | Spent: 44.6 secs | LR: 0.000013
INFO:tensorflow:Step 1800 | Loss: 0.3772 | Spent: 44.7 secs | LR: 0.000013
INFO:tensorflow:Step 1900 | Loss: 0.3757 | Spent: 44.5 secs | LR: 0.000013
INFO:tensorflow:Step 2000 | Loss: 0.3717 | Spent: 44.6 secs | LR: 0.000013
INFO:tensorflow:Step 2100 | Loss: 0.4304 | Spent: 44.9 secs | LR: 0.000013
INFO:tensorflow:Step 2200 | Loss: 0.3992 | Spent: 44.9 secs | LR: 0.000014
INFO:tensorflow:Step 2300 | Loss: 0.3812 | Spent: 44.6 secs | LR: 0.000014
INFO:tensorflow:Step 2400 | Loss: 0.5960 | Spent: 44.9 secs | LR: 0.000014
INFO:tensorflow:Step 2500 | Loss: 0.5433 | Spent: 44.5 secs | LR: 0.000014
INFO:tensorflow:Step 2600 | Loss: 0.3483 | Spent: 44.4 secs | LR: 0.000014
INFO:tensorflow:Step 2700 | Loss: 0.5280 | Spent: 44.8 secs | LR: 0.000014
INFO:tensorflow:Step 2800 | Loss: 0.5015 | Spent: 44.8 secs | LR: 0.000014
INFO:tensorflow:Step 2900 | Loss: 0.5464 | Spent: 44.7 secs | LR: 0.000015
INFO:tensorflow:Step 3000 | Loss: 0.4886 | Spent: 44.7 secs | LR: 0.000015
INFO:tensorflow:Step 3100 | Loss: 0.4396 | Spent: 44.6 secs | LR: 0.000015
INFO:tensorflow:Step 3200 | Loss: 0.5732 | Spent: 44.7 secs | LR: 0.000015
INFO:tensorflow:Step 3300 | Loss: 0.3628 | Spent: 44.7 secs | LR: 0.000015
INFO:tensorflow:Step 3400 | Loss: 0.4185 | Spent: 44.8 secs | LR: 0.000015
INFO:tensorflow:Step 3500 | Loss: 0.4944 | Spent: 44.9 secs | LR: 0.000016
INFO:tensorflow:Step 3600 | Loss: 0.4911 | Spent: 44.7 secs | LR: 0.000016
INFO:tensorflow:Step 3700 | Loss: 0.3926 | Spent: 44.6 secs | LR: 0.000016
INFO:tensorflow:Step 3800 | Loss: 0.3457 | Spent: 44.8 secs | LR: 0.000016
INFO:tensorflow:Step 3900 | Loss: 0.3514 | Spent: 44.5 secs | LR: 0.000016
INFO:tensorflow:Step 4000 | Loss: 0.3324 | Spent: 44.8 secs | LR: 0.000016
INFO:tensorflow:Step 4100 | Loss: 0.4684 | Spent: 44.3 secs | LR: 0.000017
INFO:tensorflow:Step 4200 | Loss: 0.3793 | Spent: 45.0 secs | LR: 0.000017
INFO:tensorflow:Step 4300 | Loss: 0.3481 | Spent: 44.2 secs | LR: 0.000017
INFO:tensorflow:Step 4400 | Loss: 0.3399 | Spent: 44.4 secs | LR: 0.000017
INFO:tensorflow:Step 4500 | Loss: 0.3918 | Spent: 44.7 secs | LR: 0.000017
INFO:tensorflow:Step 4600 | Loss: 0.4955 | Spent: 44.6 secs | LR: 0.000017
INFO:tensorflow:Step 4700 | Loss: 0.4218 | Spent: 45.4 secs | LR: 0.000018
INFO:tensorflow:Step 4800 | Loss: 0.3618 | Spent: 44.4 secs | LR: 0.000018
INFO:tensorflow:Step 4900 | Loss: 0.3795 | Spent: 44.9 secs | LR: 0.000018
INFO:tensorflow:Step 5000 | Loss: 0.5153 | Spent: 44.8 secs | LR: 0.000018
INFO:tensorflow:Step 5100 | Loss: 0.5062 | Spent: 44.4 secs | LR: 0.000018
INFO:tensorflow:Step 5200 | Loss: 0.3499 | Spent: 44.5 secs | LR: 0.000018
INFO:tensorflow:Step 5300 | Loss: 0.4968 | Spent: 44.7 secs | LR: 0.000018
INFO:tensorflow:Step 5400 | Loss: 0.4635 | Spent: 44.6 secs | LR: 0.000019
INFO:tensorflow:Step 5500 | Loss: 0.3608 | Spent: 44.5 secs | LR: 0.000019
INFO:tensorflow:Step 5600 | Loss: 0.6053 | Spent: 44.9 secs | LR: 0.000019
INFO:tensorflow:Step 5700 | Loss: 0.3414 | Spent: 44.5 secs | LR: 0.000019
INFO:tensorflow:Step 5800 | Loss: 0.4796 | Spent: 44.6 secs | LR: 0.000019
INFO:tensorflow:Step 5900 | Loss: 0.4905 | Spent: 44.5 secs | LR: 0.000019
INFO:tensorflow:Step 6000 | Loss: 0.4971 | Spent: 44.7 secs | LR: 0.000020
INFO:tensorflow:Step 6100 | Loss: 0.3280 | Spent: 44.7 secs | LR: 0.000020
INFO:tensorflow:Step 6200 | Loss: 0.3364 | Spent: 44.7 secs | LR: 0.000020
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.933
INFO:tensorflow:Best Accuracy: 0.933
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 6300 | Loss: 0.3264 | Spent: 486.0 secs | LR: 0.000020
INFO:tensorflow:Step 6400 | Loss: 0.4878 | Spent: 44.8 secs | LR: 0.000020
INFO:tensorflow:Step 6500 | Loss: 0.3280 | Spent: 44.5 secs | LR: 0.000020
INFO:tensorflow:Step 6600 | Loss: 0.4160 | Spent: 44.7 secs | LR: 0.000021
INFO:tensorflow:Step 6700 | Loss: 0.3444 | Spent: 44.6 secs | LR: 0.000021
INFO:tensorflow:Step 6800 | Loss: 0.4624 | Spent: 44.8 secs | LR: 0.000021
INFO:tensorflow:Step 6900 | Loss: 0.3606 | Spent: 44.4 secs | LR: 0.000021
INFO:tensorflow:Step 7000 | Loss: 0.5425 | Spent: 44.6 secs | LR: 0.000021
INFO:tensorflow:Step 7100 | Loss: 0.5896 | Spent: 44.5 secs | LR: 0.000021
INFO:tensorflow:Step 7200 | Loss: 0.3393 | Spent: 44.8 secs | LR: 0.000022
INFO:tensorflow:Step 7300 | Loss: 0.4453 | Spent: 45.3 secs | LR: 0.000022
INFO:tensorflow:Step 7400 | Loss: 0.3495 | Spent: 45.5 secs | LR: 0.000022
INFO:tensorflow:Step 7500 | Loss: 0.3278 | Spent: 44.9 secs | LR: 0.000022
INFO:tensorflow:Step 7600 | Loss: 0.3373 | Spent: 44.6 secs | LR: 0.000022
INFO:tensorflow:Step 7700 | Loss: 0.3267 | Spent: 44.7 secs | LR: 0.000022
INFO:tensorflow:Step 7800 | Loss: 0.5522 | Spent: 44.6 secs | LR: 0.000022
INFO:tensorflow:Step 7900 | Loss: 0.3308 | Spent: 44.6 secs | LR: 0.000023
INFO:tensorflow:Step 8000 | Loss: 0.4926 | Spent: 44.9 secs | LR: 0.000023
INFO:tensorflow:Step 8100 | Loss: 0.5725 | Spent: 45.0 secs | LR: 0.000023
INFO:tensorflow:Step 8200 | Loss: 0.3560 | Spent: 44.6 secs | LR: 0.000023
INFO:tensorflow:Step 8300 | Loss: 0.3372 | Spent: 44.5 secs | LR: 0.000023
INFO:tensorflow:Step 8400 | Loss: 0.3508 | Spent: 45.0 secs | LR: 0.000023
INFO:tensorflow:Step 8500 | Loss: 0.3361 | Spent: 44.5 secs | LR: 0.000024
INFO:tensorflow:Step 8600 | Loss: 0.5870 | Spent: 44.6 secs | LR: 0.000024
INFO:tensorflow:Step 8700 | Loss: 0.4423 | Spent: 44.8 secs | LR: 0.000024
INFO:tensorflow:Step 8800 | Loss: 0.3459 | Spent: 44.9 secs | LR: 0.000024
INFO:tensorflow:Step 8900 | Loss: 0.3274 | Spent: 44.7 secs | LR: 0.000024
INFO:tensorflow:Step 9000 | Loss: 0.3327 | Spent: 44.7 secs | LR: 0.000024
INFO:tensorflow:Step 9100 | Loss: 0.3278 | Spent: 44.8 secs | LR: 0.000025
INFO:tensorflow:Step 9200 | Loss: 0.3386 | Spent: 45.0 secs | LR: 0.000025
INFO:tensorflow:Step 9300 | Loss: 0.4949 | Spent: 44.7 secs | LR: 0.000025
INFO:tensorflow:Step 9400 | Loss: 0.3625 | Spent: 45.1 secs | LR: 0.000025
INFO:tensorflow:Step 9500 | Loss: 0.3279 | Spent: 44.7 secs | LR: 0.000025
INFO:tensorflow:Step 9600 | Loss: 0.3504 | Spent: 44.7 secs | LR: 0.000025
INFO:tensorflow:Step 9700 | Loss: 0.4435 | Spent: 44.7 secs | LR: 0.000026
INFO:tensorflow:Step 9800 | Loss: 0.3476 | Spent: 44.7 secs | LR: 0.000026
INFO:tensorflow:Step 9900 | Loss: 0.3268 | Spent: 44.9 secs | LR: 0.000026
INFO:tensorflow:Step 10000 | Loss: 0.3259 | Spent: 44.9 secs | LR: 0.000026
INFO:tensorflow:Step 10100 | Loss: 0.3385 | Spent: 45.0 secs | LR: 0.000026
INFO:tensorflow:Step 10200 | Loss: 0.3270 | Spent: 44.8 secs | LR: 0.000026
INFO:tensorflow:Step 10300 | Loss: 0.3271 | Spent: 44.8 secs | LR: 0.000026
INFO:tensorflow:Step 10400 | Loss: 0.3718 | Spent: 44.6 secs | LR: 0.000027
INFO:tensorflow:Step 10500 | Loss: 0.3266 | Spent: 44.7 secs | LR: 0.000027
INFO:tensorflow:Step 10600 | Loss: 0.3290 | Spent: 45.0 secs | LR: 0.000027
INFO:tensorflow:Step 10700 | Loss: 0.3262 | Spent: 44.3 secs | LR: 0.000027
INFO:tensorflow:Step 10800 | Loss: 0.3300 | Spent: 45.0 secs | LR: 0.000027
INFO:tensorflow:Step 10900 | Loss: 0.5360 | Spent: 44.8 secs | LR: 0.000027
INFO:tensorflow:Step 11000 | Loss: 0.3310 | Spent: 44.4 secs | LR: 0.000028
INFO:tensorflow:Step 11100 | Loss: 0.4993 | Spent: 44.5 secs | LR: 0.000028
INFO:tensorflow:Step 11200 | Loss: 0.4683 | Spent: 44.5 secs | LR: 0.000028
INFO:tensorflow:Step 11300 | Loss: 0.3264 | Spent: 44.9 secs | LR: 0.000028
INFO:tensorflow:Step 11400 | Loss: 0.4810 | Spent: 44.6 secs | LR: 0.000028
INFO:tensorflow:Step 11500 | Loss: 0.3320 | Spent: 44.9 secs | LR: 0.000028
INFO:tensorflow:Step 11600 | Loss: 0.3272 | Spent: 44.7 secs | LR: 0.000029
INFO:tensorflow:Step 11700 | Loss: 0.3267 | Spent: 44.7 secs | LR: 0.000029
INFO:tensorflow:Step 11800 | Loss: 0.3417 | Spent: 44.4 secs | LR: 0.000029
INFO:tensorflow:Step 11900 | Loss: 0.3327 | Spent: 44.7 secs | LR: 0.000029
INFO:tensorflow:Step 12000 | Loss: 0.5267 | Spent: 44.9 secs | LR: 0.000029
INFO:tensorflow:Step 12100 | Loss: 0.4762 | Spent: 44.8 secs | LR: 0.000029
INFO:tensorflow:Step 12200 | Loss: 0.4746 | Spent: 45.2 secs | LR: 0.000030
INFO:tensorflow:Step 12300 | Loss: 0.3316 | Spent: 44.8 secs | LR: 0.000030
INFO:tensorflow:Step 12400 | Loss: 0.4874 | Spent: 44.8 secs | LR: 0.000030
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.944
INFO:tensorflow:Best Accuracy: 0.944
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 12500 | Loss: 0.3306 | Spent: 487.7 secs | LR: 0.000030
INFO:tensorflow:Step 12600 | Loss: 0.3383 | Spent: 44.8 secs | LR: 0.000030
INFO:tensorflow:Step 12700 | Loss: 0.3276 | Spent: 44.4 secs | LR: 0.000030
INFO:tensorflow:Step 12800 | Loss: 0.3763 | Spent: 45.0 secs | LR: 0.000030
INFO:tensorflow:Step 12900 | Loss: 0.3261 | Spent: 44.8 secs | LR: 0.000029
INFO:tensorflow:Step 13000 | Loss: 0.3267 | Spent: 44.9 secs | LR: 0.000029
INFO:tensorflow:Step 13100 | Loss: 0.3348 | Spent: 44.8 secs | LR: 0.000029
INFO:tensorflow:Step 13200 | Loss: 0.4300 | Spent: 45.0 secs | LR: 0.000029
INFO:tensorflow:Step 13300 | Loss: 0.3277 | Spent: 44.9 secs | LR: 0.000029
INFO:tensorflow:Step 13400 | Loss: 0.4323 | Spent: 45.0 secs | LR: 0.000029
INFO:tensorflow:Step 13500 | Loss: 0.5061 | Spent: 44.7 secs | LR: 0.000028
INFO:tensorflow:Step 13600 | Loss: 0.3265 | Spent: 45.0 secs | LR: 0.000028
INFO:tensorflow:Step 13700 | Loss: 0.3281 | Spent: 44.8 secs | LR: 0.000028
INFO:tensorflow:Step 13800 | Loss: 0.3489 | Spent: 44.9 secs | LR: 0.000028
INFO:tensorflow:Step 13900 | Loss: 0.3350 | Spent: 44.5 secs | LR: 0.000028
INFO:tensorflow:Step 14000 | Loss: 0.3268 | Spent: 45.0 secs | LR: 0.000028
INFO:tensorflow:Step 14100 | Loss: 0.3262 | Spent: 44.7 secs | LR: 0.000027
INFO:tensorflow:Step 14200 | Loss: 0.4429 | Spent: 44.6 secs | LR: 0.000027
INFO:tensorflow:Step 14300 | Loss: 0.3260 | Spent: 44.5 secs | LR: 0.000027
INFO:tensorflow:Step 14400 | Loss: 0.3416 | Spent: 44.9 secs | LR: 0.000027
INFO:tensorflow:Step 14500 | Loss: 0.3271 | Spent: 44.3 secs | LR: 0.000027
INFO:tensorflow:Step 14600 | Loss: 0.3274 | Spent: 45.1 secs | LR: 0.000027
INFO:tensorflow:Step 14700 | Loss: 0.5500 | Spent: 45.9 secs | LR: 0.000026
INFO:tensorflow:Step 14800 | Loss: 0.3419 | Spent: 44.7 secs | LR: 0.000026
INFO:tensorflow:Step 14900 | Loss: 0.3397 | Spent: 44.7 secs | LR: 0.000026
INFO:tensorflow:Step 15000 | Loss: 0.3282 | Spent: 45.2 secs | LR: 0.000026
INFO:tensorflow:Step 15100 | Loss: 0.3260 | Spent: 45.0 secs | LR: 0.000026
INFO:tensorflow:Step 15200 | Loss: 0.4951 | Spent: 44.8 secs | LR: 0.000026
INFO:tensorflow:Step 15300 | Loss: 0.5341 | Spent: 45.3 secs | LR: 0.000026
INFO:tensorflow:Step 15400 | Loss: 0.4507 | Spent: 44.9 secs | LR: 0.000025
INFO:tensorflow:Step 15500 | Loss: 0.3283 | Spent: 45.1 secs | LR: 0.000025
INFO:tensorflow:Step 15600 | Loss: 0.5348 | Spent: 45.1 secs | LR: 0.000025
INFO:tensorflow:Step 15700 | Loss: 0.4832 | Spent: 44.9 secs | LR: 0.000025
INFO:tensorflow:Step 15800 | Loss: 0.5047 | Spent: 44.8 secs | LR: 0.000025
INFO:tensorflow:Step 15900 | Loss: 0.4627 | Spent: 45.0 secs | LR: 0.000025
INFO:tensorflow:Step 16000 | Loss: 0.3297 | Spent: 44.8 secs | LR: 0.000024
INFO:tensorflow:Step 16100 | Loss: 0.3291 | Spent: 45.1 secs | LR: 0.000024
INFO:tensorflow:Step 16200 | Loss: 0.3318 | Spent: 45.0 secs | LR: 0.000024
INFO:tensorflow:Step 16300 | Loss: 0.3265 | Spent: 44.9 secs | LR: 0.000024
INFO:tensorflow:Step 16400 | Loss: 0.3290 | Spent: 44.8 secs | LR: 0.000024
INFO:tensorflow:Step 16500 | Loss: 0.3299 | Spent: 44.6 secs | LR: 0.000024
INFO:tensorflow:Step 16600 | Loss: 0.3276 | Spent: 44.5 secs | LR: 0.000023
INFO:tensorflow:Step 16700 | Loss: 0.4525 | Spent: 45.0 secs | LR: 0.000023
INFO:tensorflow:Step 16800 | Loss: 0.3287 | Spent: 45.1 secs | LR: 0.000023
INFO:tensorflow:Step 16900 | Loss: 0.3288 | Spent: 45.0 secs | LR: 0.000023
INFO:tensorflow:Step 17000 | Loss: 0.5101 | Spent: 45.0 secs | LR: 0.000023
INFO:tensorflow:Step 17100 | Loss: 0.4731 | Spent: 44.8 secs | LR: 0.000023
INFO:tensorflow:Step 17200 | Loss: 0.3287 | Spent: 44.8 secs | LR: 0.000022
INFO:tensorflow:Step 17300 | Loss: 0.3266 | Spent: 44.8 secs | LR: 0.000022
INFO:tensorflow:Step 17400 | Loss: 0.3299 | Spent: 44.8 secs | LR: 0.000022
INFO:tensorflow:Step 17500 | Loss: 0.4502 | Spent: 45.1 secs | LR: 0.000022
INFO:tensorflow:Step 17600 | Loss: 0.3271 | Spent: 44.8 secs | LR: 0.000022
INFO:tensorflow:Step 17700 | Loss: 0.3295 | Spent: 44.9 secs | LR: 0.000022
INFO:tensorflow:Step 17800 | Loss: 0.4611 | Spent: 44.6 secs | LR: 0.000022
INFO:tensorflow:Step 17900 | Loss: 0.3301 | Spent: 44.7 secs | LR: 0.000021
INFO:tensorflow:Step 18000 | Loss: 0.3275 | Spent: 45.0 secs | LR: 0.000021
INFO:tensorflow:Step 18100 | Loss: 0.5254 | Spent: 45.0 secs | LR: 0.000021
INFO:tensorflow:Step 18200 | Loss: 0.3331 | Spent: 44.5 secs | LR: 0.000021
INFO:tensorflow:Step 18300 | Loss: 0.3285 | Spent: 44.9 secs | LR: 0.000021
INFO:tensorflow:Step 18400 | Loss: 0.3433 | Spent: 45.1 secs | LR: 0.000021
INFO:tensorflow:Step 18500 | Loss: 0.3384 | Spent: 44.7 secs | LR: 0.000020
INFO:tensorflow:Step 18600 | Loss: 0.4522 | Spent: 45.2 secs | LR: 0.000020
INFO:tensorflow:Step 18700 | Loss: 0.3272 | Spent: 45.0 secs | LR: 0.000020
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.942
INFO:tensorflow:Best Accuracy: 0.944
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 18800 | Loss: 0.3264 | Spent: 492.8 secs | LR: 0.000020
INFO:tensorflow:Step 18900 | Loss: 0.3269 | Spent: 45.5 secs | LR: 0.000020
INFO:tensorflow:Step 19000 | Loss: 0.3271 | Spent: 45.2 secs | LR: 0.000020
INFO:tensorflow:Step 19100 | Loss: 0.3286 | Spent: 45.1 secs | LR: 0.000019
INFO:tensorflow:Step 19200 | Loss: 0.4994 | Spent: 45.4 secs | LR: 0.000019
INFO:tensorflow:Step 19300 | Loss: 0.3263 | Spent: 45.3 secs | LR: 0.000019
INFO:tensorflow:Step 19400 | Loss: 0.3255 | Spent: 45.0 secs | LR: 0.000019
INFO:tensorflow:Step 19500 | Loss: 0.3273 | Spent: 45.3 secs | LR: 0.000019
INFO:tensorflow:Step 19600 | Loss: 0.3272 | Spent: 45.2 secs | LR: 0.000019
INFO:tensorflow:Step 19700 | Loss: 0.3265 | Spent: 45.3 secs | LR: 0.000018
INFO:tensorflow:Step 19800 | Loss: 0.3300 | Spent: 45.6 secs | LR: 0.000018
INFO:tensorflow:Step 19900 | Loss: 0.3270 | Spent: 45.7 secs | LR: 0.000018
INFO:tensorflow:Step 20000 | Loss: 0.3282 | Spent: 45.4 secs | LR: 0.000018
INFO:tensorflow:Step 20100 | Loss: 0.4872 | Spent: 45.3 secs | LR: 0.000018
INFO:tensorflow:Step 20200 | Loss: 0.5375 | Spent: 45.4 secs | LR: 0.000018
INFO:tensorflow:Step 20300 | Loss: 0.3265 | Spent: 45.4 secs | LR: 0.000018
INFO:tensorflow:Step 20400 | Loss: 0.5571 | Spent: 45.3 secs | LR: 0.000017
INFO:tensorflow:Step 20500 | Loss: 0.3258 | Spent: 45.3 secs | LR: 0.000017
INFO:tensorflow:Step 20600 | Loss: 0.3294 | Spent: 45.4 secs | LR: 0.000017
INFO:tensorflow:Step 20700 | Loss: 0.4630 | Spent: 44.9 secs | LR: 0.000017
INFO:tensorflow:Step 20800 | Loss: 0.3260 | Spent: 44.8 secs | LR: 0.000017
INFO:tensorflow:Step 20900 | Loss: 0.3271 | Spent: 45.2 secs | LR: 0.000017
INFO:tensorflow:Step 21000 | Loss: 0.3257 | Spent: 44.8 secs | LR: 0.000016
INFO:tensorflow:Step 21100 | Loss: 0.3267 | Spent: 45.2 secs | LR: 0.000016
INFO:tensorflow:Step 21200 | Loss: 0.5566 | Spent: 45.0 secs | LR: 0.000016
INFO:tensorflow:Step 21300 | Loss: 0.3257 | Spent: 45.3 secs | LR: 0.000016
INFO:tensorflow:Step 21400 | Loss: 0.3261 | Spent: 45.2 secs | LR: 0.000016
INFO:tensorflow:Step 21500 | Loss: 0.3266 | Spent: 45.1 secs | LR: 0.000016
INFO:tensorflow:Step 21600 | Loss: 0.3270 | Spent: 45.2 secs | LR: 0.000015
INFO:tensorflow:Step 21700 | Loss: 0.3277 | Spent: 45.3 secs | LR: 0.000015
INFO:tensorflow:Step 21800 | Loss: 0.3257 | Spent: 46.2 secs | LR: 0.000015
INFO:tensorflow:Step 21900 | Loss: 0.3260 | Spent: 45.7 secs | LR: 0.000015
INFO:tensorflow:Step 22000 | Loss: 0.4840 | Spent: 45.8 secs | LR: 0.000015
INFO:tensorflow:Step 22100 | Loss: 0.3263 | Spent: 45.1 secs | LR: 0.000015
INFO:tensorflow:Step 22200 | Loss: 0.3357 | Spent: 44.9 secs | LR: 0.000014
INFO:tensorflow:Step 22300 | Loss: 0.3267 | Spent: 45.2 secs | LR: 0.000014
INFO:tensorflow:Step 22400 | Loss: 0.3259 | Spent: 45.0 secs | LR: 0.000014
INFO:tensorflow:Step 22500 | Loss: 0.3256 | Spent: 45.2 secs | LR: 0.000014
INFO:tensorflow:Step 22600 | Loss: 0.3263 | Spent: 45.3 secs | LR: 0.000014
INFO:tensorflow:Step 22700 | Loss: 0.3258 | Spent: 45.4 secs | LR: 0.000014
INFO:tensorflow:Step 22800 | Loss: 0.7530 | Spent: 45.4 secs | LR: 0.000014
INFO:tensorflow:Step 22900 | Loss: 0.3255 | Spent: 45.5 secs | LR: 0.000013
INFO:tensorflow:Step 23000 | Loss: 0.3287 | Spent: 45.0 secs | LR: 0.000013
INFO:tensorflow:Step 23100 | Loss: 0.3259 | Spent: 45.3 secs | LR: 0.000013
INFO:tensorflow:Step 23200 | Loss: 0.3279 | Spent: 45.3 secs | LR: 0.000013
INFO:tensorflow:Step 23300 | Loss: 0.4298 | Spent: 45.2 secs | LR: 0.000013
INFO:tensorflow:Step 23400 | Loss: 0.3272 | Spent: 45.5 secs | LR: 0.000013
INFO:tensorflow:Step 23500 | Loss: 0.3272 | Spent: 45.1 secs | LR: 0.000012
INFO:tensorflow:Step 23600 | Loss: 0.3280 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 23700 | Loss: 0.3258 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 23800 | Loss: 0.3276 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 23900 | Loss: 0.3536 | Spent: 45.0 secs | LR: 0.000012
INFO:tensorflow:Step 24000 | Loss: 0.3957 | Spent: 45.5 secs | LR: 0.000012
INFO:tensorflow:Step 24100 | Loss: 0.3270 | Spent: 45.1 secs | LR: 0.000011
INFO:tensorflow:Step 24200 | Loss: 0.3263 | Spent: 45.1 secs | LR: 0.000011
INFO:tensorflow:Step 24300 | Loss: 0.3265 | Spent: 45.1 secs | LR: 0.000011
INFO:tensorflow:Step 24400 | Loss: 0.3282 | Spent: 45.2 secs | LR: 0.000011
INFO:tensorflow:Step 24500 | Loss: 0.3257 | Spent: 45.2 secs | LR: 0.000011
INFO:tensorflow:Step 24600 | Loss: 0.4458 | Spent: 45.4 secs | LR: 0.000011
INFO:tensorflow:Step 24700 | Loss: 0.3255 | Spent: 45.5 secs | LR: 0.000010
INFO:tensorflow:Step 24800 | Loss: 0.3282 | Spent: 45.5 secs | LR: 0.000010
INFO:tensorflow:Step 24900 | Loss: 0.3254 | Spent: 44.9 secs | LR: 0.000010
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.947
INFO:tensorflow:Best Accuracy: 0.947
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt
Reading ../data/train_bt_part6.txt
INFO:tensorflow:Step 25000 | Loss: 0.3260 | Spent: 496.5 secs | LR: 0.000010
INFO:tensorflow:Step 25100 | Loss: 0.3256 | Spent: 45.8 secs | LR: 0.000010
INFO:tensorflow:Step 25200 | Loss: 0.3272 | Spent: 45.2 secs | LR: 0.000010
INFO:tensorflow:Step 25300 | Loss: 0.3258 | Spent: 45.4 secs | LR: 0.000010
INFO:tensorflow:Step 25400 | Loss: 0.3259 | Spent: 45.1 secs | LR: 0.000010
INFO:tensorflow:Step 25500 | Loss: 0.3258 | Spent: 45.0 secs | LR: 0.000010
INFO:tensorflow:Step 25600 | Loss: 0.3260 | Spent: 44.9 secs | LR: 0.000010
INFO:tensorflow:Step 25700 | Loss: 0.3261 | Spent: 45.3 secs | LR: 0.000011
INFO:tensorflow:Step 25800 | Loss: 0.3258 | Spent: 45.0 secs | LR: 0.000011
INFO:tensorflow:Step 25900 | Loss: 0.3279 | Spent: 45.0 secs | LR: 0.000011
INFO:tensorflow:Step 26000 | Loss: 0.3260 | Spent: 44.8 secs | LR: 0.000011
INFO:tensorflow:Step 26100 | Loss: 0.3262 | Spent: 44.8 secs | LR: 0.000011
INFO:tensorflow:Step 26200 | Loss: 0.3254 | Spent: 45.2 secs | LR: 0.000011
INFO:tensorflow:Step 26300 | Loss: 0.5372 | Spent: 44.8 secs | LR: 0.000011
INFO:tensorflow:Step 26400 | Loss: 0.3256 | Spent: 44.8 secs | LR: 0.000011
INFO:tensorflow:Step 26500 | Loss: 0.3254 | Spent: 45.3 secs | LR: 0.000011
INFO:tensorflow:Step 26600 | Loss: 0.3257 | Spent: 45.0 secs | LR: 0.000011
INFO:tensorflow:Step 26700 | Loss: 0.3279 | Spent: 45.4 secs | LR: 0.000011
INFO:tensorflow:Step 26800 | Loss: 0.5233 | Spent: 45.3 secs | LR: 0.000011
INFO:tensorflow:Step 26900 | Loss: 0.3268 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 27000 | Loss: 0.3256 | Spent: 45.4 secs | LR: 0.000012
INFO:tensorflow:Step 27100 | Loss: 0.3257 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 27200 | Loss: 0.4969 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 27300 | Loss: 0.3256 | Spent: 45.3 secs | LR: 0.000012
INFO:tensorflow:Step 27400 | Loss: 0.3256 | Spent: 45.4 secs | LR: 0.000012
INFO:tensorflow:Step 27500 | Loss: 0.3261 | Spent: 45.5 secs | LR: 0.000012
INFO:tensorflow:Step 27600 | Loss: 0.3264 | Spent: 45.5 secs | LR: 0.000012
INFO:tensorflow:Step 27700 | Loss: 0.3260 | Spent: 45.1 secs | LR: 0.000012
INFO:tensorflow:Step 27800 | Loss: 0.3317 | Spent: 45.9 secs | LR: 0.000012
INFO:tensorflow:Step 27900 | Loss: 0.3256 | Spent: 45.5 secs | LR: 0.000012
INFO:tensorflow:Step 28000 | Loss: 0.3269 | Spent: 45.5 secs | LR: 0.000012
INFO:tensorflow:Step 28100 | Loss: 0.3257 | Spent: 45.7 secs | LR: 0.000012
INFO:tensorflow:Step 28200 | Loss: 0.4445 | Spent: 45.7 secs | LR: 0.000013
INFO:tensorflow:Step 28300 | Loss: 0.3256 | Spent: 45.7 secs | LR: 0.000013
INFO:tensorflow:Step 28400 | Loss: 0.5364 | Spent: 45.8 secs | LR: 0.000013
INFO:tensorflow:Step 28500 | Loss: 0.3272 | Spent: 45.8 secs | LR: 0.000013
INFO:tensorflow:Step 28600 | Loss: 0.3254 | Spent: 45.3 secs | LR: 0.000013
INFO:tensorflow:Step 28700 | Loss: 0.3273 | Spent: 45.1 secs | LR: 0.000013
INFO:tensorflow:Step 28800 | Loss: 0.3265 | Spent: 45.2 secs | LR: 0.000013
INFO:tensorflow:Step 28900 | Loss: 0.3304 | Spent: 45.2 secs | LR: 0.000013
INFO:tensorflow:Step 29000 | Loss: 0.3255 | Spent: 45.3 secs | LR: 0.000013
INFO:tensorflow:Step 29100 | Loss: 0.3258 | Spent: 45.3 secs | LR: 0.000013
INFO:tensorflow:Step 29200 | Loss: 0.3262 | Spent: 45.8 secs | LR: 0.000013
INFO:tensorflow:Step 29300 | Loss: 0.3263 | Spent: 45.1 secs | LR: 0.000013
INFO:tensorflow:Step 29400 | Loss: 0.3261 | Spent: 45.3 secs | LR: 0.000014
INFO:tensorflow:Step 29500 | Loss: 0.3262 | Spent: 45.1 secs | LR: 0.000014
INFO:tensorflow:Step 29600 | Loss: 0.3263 | Spent: 45.4 secs | LR: 0.000014
INFO:tensorflow:Step 29700 | Loss: 0.3259 | Spent: 45.4 secs | LR: 0.000014
INFO:tensorflow:Step 29800 | Loss: 0.3263 | Spent: 45.5 secs | LR: 0.000014
INFO:tensorflow:Step 29900 | Loss: 0.3259 | Spent: 45.5 secs | LR: 0.000014
INFO:tensorflow:Step 30000 | Loss: 0.3273 | Spent: 45.2 secs | LR: 0.000014
INFO:tensorflow:Step 30100 | Loss: 0.3259 | Spent: 44.9 secs | LR: 0.000014
INFO:tensorflow:Step 30200 | Loss: 0.3255 | Spent: 45.0 secs | LR: 0.000014
INFO:tensorflow:Step 30300 | Loss: 0.3259 | Spent: 44.8 secs | LR: 0.000014
INFO:tensorflow:Step 30400 | Loss: 0.3256 | Spent: 45.2 secs | LR: 0.000014
INFO:tensorflow:Step 30500 | Loss: 0.3255 | Spent: 45.0 secs | LR: 0.000014
INFO:tensorflow:Step 30600 | Loss: 0.3254 | Spent: 45.2 secs | LR: 0.000014
INFO:tensorflow:Step 30700 | Loss: 0.3371 | Spent: 45.1 secs | LR: 0.000015
INFO:tensorflow:Step 30800 | Loss: 0.3262 | Spent: 44.8 secs | LR: 0.000015
INFO:tensorflow:Step 30900 | Loss: 0.5159 | Spent: 45.0 secs | LR: 0.000015
INFO:tensorflow:Step 31000 | Loss: 0.3255 | Spent: 45.1 secs | LR: 0.000015
INFO:tensorflow:Step 31100 | Loss: 0.3262 | Spent: 45.1 secs | LR: 0.000015
INFO:tensorflow:Step 31200 | Loss: 0.3266 | Spent: 44.9 secs | LR: 0.000015
Reading ../data/test.txt
INFO:tensorflow:Evaluation: Testing Accuracy: 0.941
INFO:tensorflow:Best Accuracy: 0.947
Reading ../data/train_bt_part1.txt
Reading ../data/train_bt_part2.txt
Reading ../data/train_bt_part3.txt
Reading ../data/train_bt_part4.txt
Reading ../data/train_bt_part5.txt