In [1]:
import tensorflow as tf
import argparse
import time
import pickle
import numpy as np
import os
os.environ["TF_CPP_MIN_LOG_LEVEL"]="2"

from utils import DataLoader
from BiRNNLayer import BiRNNLayer
from PointerLayer import PointerLayer
from AttentionLayer import AttentionLayer

data_dir = 'data'
output_keep_prob = 1.0
input_keep_prob = 1.0
batch_size = 10
num_epochs = 10
rnn_size = 128
learning_rate = 0.002
decay_rate = 0.97

data_loader = DataLoader(data_dir, batch_size)
data_loader.create_batches()
max_para_length = data_loader.max_para_length
max_ques_length = data_loader.max_ques_length
vocab_size = data_loader.vocab_size

#Initialize layers
paragraph_layer = BiRNNLayer(vocab_size, batch_size=batch_size, scope="paraBiRNN")
question_layer = BiRNNLayer(vocab_size, batch_size=batch_size, scope="quesBiRNN")
attention_layer = AttentionLayer(paragraph_layer.outputs, question_layer.outputs, batch_size=batch_size, hidden_size=rnn_size, scope="attention")
output_layer = PointerLayer(attention_layer.outputs, batch_size=batch_size, scope="pointer")


loading preprocessed data...
loading vocab file...
building BiRNNLayer paraBiRNN
building BiRNNLayer quesBiRNN
building attention layer attention
building pointer layer pointer

In [2]:
with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    for e in range(num_epochs):
        sess.run(tf.assign(output_layer.learning_rate, learning_rate * (decay_rate ** e)))
        for b in range(data_loader.num_batches):
            start = time.time()
            paragraphs, p_length, questions, q_length, targets_start, targets_end = data_loader.next_batch_variable_seq_length()
            print([len(p) for p in paragraphs])
            feed = {paragraph_layer.inputs: paragraphs,
                    paragraph_layer.seq_length: p_length,
                    question_layer.inputs: questions,
                    question_layer.seq_length: q_length,
                    output_layer.targets_start: targets_start, 
                    output_layer.targets_end: targets_end}
            train_loss, p1, p2, a, b, c, _ = sess.run([output_layer.cost, output_layer.p1, output_layer.p2, output_layer.a, output_layer.b, output_layer.c, output_layer.train_op], feed)

            end = time.time()
            print("{}/{} (epoch {}), train_loss = {:.3f}, time/batch = {:.3f}"
                  .format(e * data_loader.num_batches + b,
                          num_epochs * data_loader.num_batches,
                          e, train_loss, end - start))


heyyy???
572fa64db2c2fd14005682ab
573033c3a23a5019007fcf72
572e7aa8dfa6aa1500f8d00f
5727b1adff5b5019007d92c1
5726d11ef1498d1400e8ec2e
5727b2b2ff5b5019007d92d2
56df10063277331400b4d92b
5726e5c9f1498d1400e8ef3a
5706477d75f01819005e7af8
572f618b04bcaa1900d768a6
248 17
[248, 248, 248, 248, 248, 248, 248, 248, 248, 248]
[ 0.          0.0039733   0.0040125   0.          0.          0.00408616
  0.          0.00408359  0.          0.        ]/87600 (epoch 0), train_loss = inf, time/batch = 0.902
heyyy???
572ba75ff75d5e190021fe72
56d6477c1c85041400947069
57312bcd05b4da19006bce2f
5725e762271a42140099d2ff
572cbf35dfb02c14005c6c20
56fb673d8ddada1400cd63d1
56d3686b59d6e41400146307
56d5d92a1c85041400946e2f
5727ba3c2ca10214002d94cc
572f618b04bcaa1900d768a6
239 18
[239, 239, 239, 239, 239, 239, 239, 239, 239, 239]
---------------------------------------------------------------------------
InvalidArgumentError                      Traceback (most recent call last)
c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in _do_call(self, fn, *args)
   1038     try:
-> 1039       return fn(*args)
   1040     except errors.OpError as e:

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in _run_fn(session, feed_dict, fetch_list, target_list, options, run_metadata)
   1020                                  feed_dict, fetch_list, target_list,
-> 1021                                  status, run_metadata)
   1022 

c:\users\administrator\appdata\local\programs\python\python35\lib\contextlib.py in __exit__(self, type, value, traceback)
     65             try:
---> 66                 next(self.gen)
     67             except StopIteration:

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\framework\errors_impl.py in raise_exception_on_not_ok_status()
    465           compat.as_text(pywrap_tensorflow.TF_Message(status)),
--> 466           pywrap_tensorflow.TF_GetCode(status))
    467   finally:

InvalidArgumentError: seq_lens(1) < 0
	 [[Node: quesBiRNN_1/cell_0/bidirectional_rnn/bw/ReverseSequence = ReverseSequence[T=DT_FLOAT, Tlen=DT_INT32, batch_dim=0, seq_dim=1, _device="/job:localhost/replica:0/task:0/cpu:0"](embedding_lookup_1, Cast_1)]]

During handling of the above exception, another exception occurred:

InvalidArgumentError                      Traceback (most recent call last)
<ipython-input-2-00c3f780a5c1> in <module>()
     13                     output_layer.targets_start: targets_start,
     14                     output_layer.targets_end: targets_end}
---> 15             train_loss, p1, p2, a, b, c, _ = sess.run([output_layer.cost, output_layer.p1, output_layer.p2, output_layer.a, output_layer.b, output_layer.c, output_layer.train_op], feed)
     16 
     17             end = time.time()

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in run(self, fetches, feed_dict, options, run_metadata)
    776     try:
    777       result = self._run(None, fetches, feed_dict, options_ptr,
--> 778                          run_metadata_ptr)
    779       if run_metadata:
    780         proto_data = tf_session.TF_GetBuffer(run_metadata_ptr)

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in _run(self, handle, fetches, feed_dict, options, run_metadata)
    980     if final_fetches or final_targets:
    981       results = self._do_run(handle, final_targets, final_fetches,
--> 982                              feed_dict_string, options, run_metadata)
    983     else:
    984       results = []

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in _do_run(self, handle, target_list, fetch_list, feed_dict, options, run_metadata)
   1030     if handle is None:
   1031       return self._do_call(_run_fn, self._session, feed_dict, fetch_list,
-> 1032                            target_list, options, run_metadata)
   1033     else:
   1034       return self._do_call(_prun_fn, self._session, handle, feed_dict,

c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\client\session.py in _do_call(self, fn, *args)
   1050         except KeyError:
   1051           pass
-> 1052       raise type(e)(node_def, op, message)
   1053 
   1054   def _extend_graph(self):

InvalidArgumentError: seq_lens(1) < 0
	 [[Node: quesBiRNN_1/cell_0/bidirectional_rnn/bw/ReverseSequence = ReverseSequence[T=DT_FLOAT, Tlen=DT_INT32, batch_dim=0, seq_dim=1, _device="/job:localhost/replica:0/task:0/cpu:0"](embedding_lookup_1, Cast_1)]]

Caused by op 'quesBiRNN_1/cell_0/bidirectional_rnn/bw/ReverseSequence', defined at:
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\runpy.py", line 193, in _run_module_as_main
    "__main__", mod_spec)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\runpy.py", line 85, in _run_code
    exec(code, run_globals)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel_launcher.py", line 16, in <module>
    app.launch_new_instance()
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\traitlets\config\application.py", line 658, in launch_instance
    app.start()
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\kernelapp.py", line 477, in start
    ioloop.IOLoop.instance().start()
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\zmq\eventloop\ioloop.py", line 177, in start
    super(ZMQIOLoop, self).start()
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tornado\ioloop.py", line 888, in start
    handler_func(fd_obj, events)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
    return fn(*args, **kwargs)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\zmq\eventloop\zmqstream.py", line 440, in _handle_events
    self._handle_recv()
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\zmq\eventloop\zmqstream.py", line 472, in _handle_recv
    self._run_callback(callback, msg)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\zmq\eventloop\zmqstream.py", line 414, in _run_callback
    callback(*args, **kwargs)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
    return fn(*args, **kwargs)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\kernelbase.py", line 283, in dispatcher
    return self.dispatch_shell(stream, msg)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\kernelbase.py", line 235, in dispatch_shell
    handler(stream, idents, msg)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\kernelbase.py", line 399, in execute_request
    user_expressions, allow_stdin)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\ipkernel.py", line 196, in do_execute
    res = shell.run_cell(code, store_history=store_history, silent=silent)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\ipykernel\zmqshell.py", line 533, in run_cell
    return super(ZMQInteractiveShell, self).run_cell(*args, **kwargs)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\IPython\core\interactiveshell.py", line 2683, in run_cell
    interactivity=interactivity, compiler=compiler, result=result)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\IPython\core\interactiveshell.py", line 2787, in run_ast_nodes
    if self.run_code(code, result):
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\IPython\core\interactiveshell.py", line 2847, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "<ipython-input-1-fa98d11239d2>", line 31, in <module>
    question_layer = BiRNNLayer(vocab_size, batch_size=batch_size, scope="quesBiRNN")
  File "C:\Users\Administrator\repos\squad_exp\BiRNNLayer.py", line 64, in __init__
    outputs, output_states_fw, output_states_bw = rnn.stack_bidirectional_dynamic_rnn(cells_fw, cells_bw, inputs, initial_states_fw, initial_states_bw, dtype=tf.float32, sequence_length=seq_lengths, scope=scope)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\contrib\rnn\python\ops\rnn.py", line 221, in stack_bidirectional_dynamic_rnn
    dtype=dtype)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\ops\rnn.py", line 371, in bidirectional_dynamic_rnn
    seq_dim=time_dim, batch_dim=batch_dim)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\ops\rnn.py", line 364, in _reverse
    seq_dim=seq_dim, batch_dim=batch_dim)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\ops\array_ops.py", line 2333, in reverse_sequence
    name=name)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\ops\gen_array_ops.py", line 2656, in reverse_sequence
    batch_dim=batch_dim, name=name)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\framework\op_def_library.py", line 768, in apply_op
    op_def=op_def)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\framework\ops.py", line 2336, in create_op
    original_op=self._default_original_op, op_def=op_def)
  File "c:\users\administrator\appdata\local\programs\python\python35\lib\site-packages\tensorflow\python\framework\ops.py", line 1228, in __init__
    self._traceback = _extract_stack()

InvalidArgumentError (see above for traceback): seq_lens(1) < 0
	 [[Node: quesBiRNN_1/cell_0/bidirectional_rnn/bw/ReverseSequence = ReverseSequence[T=DT_FLOAT, Tlen=DT_INT32, batch_dim=0, seq_dim=1, _device="/job:localhost/replica:0/task:0/cpu:0"](embedding_lookup_1, Cast_1)]]

In [ ]: