observer_test.py 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154
  1. import numpy as np
  2. import unittest
  3. from hypothesis import given, settings
  4. import hypothesis.strategies as st
  5. from caffe2.python import brew, core, model_helper, rnn_cell
  6. import caffe2.python.workspace as ws
  7. class TestObservers(unittest.TestCase):
  8. def setUp(self):
  9. core.GlobalInit(["python", "caffe2"])
  10. ws.ResetWorkspace()
  11. self.model = model_helper.ModelHelper()
  12. brew.fc(self.model, "data", "y",
  13. dim_in=4, dim_out=2,
  14. weight_init=('ConstantFill', dict(value=1.0)),
  15. bias_init=('ConstantFill', dict(value=0.0)),
  16. axis=0)
  17. ws.FeedBlob("data", np.zeros([4], dtype='float32'))
  18. ws.RunNetOnce(self.model.param_init_net)
  19. ws.CreateNet(self.model.net)
  20. def testObserver(self):
  21. ob = self.model.net.AddObserver("TimeObserver")
  22. ws.RunNet(self.model.net)
  23. print(ob.average_time())
  24. num = self.model.net.NumObservers()
  25. self.model.net.RemoveObserver(ob)
  26. assert(self.model.net.NumObservers() + 1 == num)
  27. @given(
  28. num_layers=st.integers(1, 4),
  29. forward_only=st.booleans()
  30. )
  31. @settings(deadline=1000)
  32. def test_observer_rnn_executor(self, num_layers, forward_only):
  33. '''
  34. Test that the RNN executor produces same results as
  35. the non-executor (i.e running step nets as sequence of simple nets).
  36. '''
  37. Tseq = [2, 3, 4]
  38. batch_size = 10
  39. input_dim = 3
  40. hidden_dim = 3
  41. run_cnt = [0] * len(Tseq)
  42. avg_time = [0] * len(Tseq)
  43. for j in range(len(Tseq)):
  44. T = Tseq[j]
  45. ws.ResetWorkspace()
  46. ws.FeedBlob(
  47. "seq_lengths",
  48. np.array([T] * batch_size, dtype=np.int32)
  49. )
  50. ws.FeedBlob("target", np.random.rand(
  51. T, batch_size, hidden_dim).astype(np.float32))
  52. ws.FeedBlob("hidden_init", np.zeros(
  53. [1, batch_size, hidden_dim], dtype=np.float32
  54. ))
  55. ws.FeedBlob("cell_init", np.zeros(
  56. [1, batch_size, hidden_dim], dtype=np.float32
  57. ))
  58. model = model_helper.ModelHelper(name="lstm")
  59. model.net.AddExternalInputs(["input"])
  60. init_blobs = []
  61. for i in range(num_layers):
  62. hidden_init, cell_init = model.net.AddExternalInputs(
  63. "hidden_init_{}".format(i),
  64. "cell_init_{}".format(i)
  65. )
  66. init_blobs.extend([hidden_init, cell_init])
  67. output, last_hidden, _, last_state = rnn_cell.LSTM(
  68. model=model,
  69. input_blob="input",
  70. seq_lengths="seq_lengths",
  71. initial_states=init_blobs,
  72. dim_in=input_dim,
  73. dim_out=[hidden_dim] * num_layers,
  74. drop_states=True,
  75. forward_only=forward_only,
  76. return_last_layer_only=True,
  77. )
  78. loss = model.AveragedLoss(
  79. model.SquaredL2Distance([output, "target"], "dist"),
  80. "loss"
  81. )
  82. # Add gradient ops
  83. if not forward_only:
  84. model.AddGradientOperators([loss])
  85. # init
  86. for init_blob in init_blobs:
  87. ws.FeedBlob(init_blob, np.zeros(
  88. [1, batch_size, hidden_dim], dtype=np.float32
  89. ))
  90. ws.RunNetOnce(model.param_init_net)
  91. # Run with executor
  92. self.enable_rnn_executor(model.net, 1, forward_only)
  93. np.random.seed(10022015)
  94. input_shape = [T, batch_size, input_dim]
  95. ws.FeedBlob(
  96. "input",
  97. np.random.rand(*input_shape).astype(np.float32)
  98. )
  99. ws.FeedBlob(
  100. "target",
  101. np.random.rand(
  102. T,
  103. batch_size,
  104. hidden_dim
  105. ).astype(np.float32)
  106. )
  107. ws.CreateNet(model.net, overwrite=True)
  108. time_ob = model.net.AddObserver("TimeObserver")
  109. run_cnt_ob = model.net.AddObserver("RunCountObserver")
  110. ws.RunNet(model.net)
  111. avg_time[j] = time_ob.average_time()
  112. run_cnt[j] = int(''.join(x for x in run_cnt_ob.debug_info() if x.isdigit()))
  113. model.net.RemoveObserver(time_ob)
  114. model.net.RemoveObserver(run_cnt_ob)
  115. print(avg_time)
  116. print(run_cnt)
  117. self.assertTrue(run_cnt[1] > run_cnt[0] and run_cnt[2] > run_cnt[1])
  118. self.assertEqual(run_cnt[1] - run_cnt[0], run_cnt[2] - run_cnt[1])
  119. def enable_rnn_executor(self, net, value, forward_only):
  120. num_found = 0
  121. for op in net.Proto().op:
  122. if op.type.startswith("RecurrentNetwork"):
  123. for arg in op.arg:
  124. if arg.name == 'enable_rnn_executor':
  125. arg.i = value
  126. num_found += 1
  127. # This sanity check is so that if someone changes the
  128. # enable_rnn_executor parameter name, the test will
  129. # start failing as this function will become defective.
  130. self.assertEqual(1 if forward_only else 2, num_found)