Class: DNN::Layers::LSTMDense

Inherits:
Object
Defined in:
lib/dnn/core/rnn_layers.rb

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(weight, recurrent_weight, bias) ⇒ LSTMDense

Returns a new instance of LSTMDense.



226
227
228
229
230
231
232
233
234
235
236
# File 'lib/dnn/core/rnn_layers.rb', line 226

# Builds one LSTM cell sharing the given parameter objects.
#
# weight           - input-to-gates weight parameter (columns hold the
#                    four gates: forget | g | in | out).
# recurrent_weight - hidden-to-gates weight parameter.
# bias             - bias parameter, or nil when the cell is unbiased.
def initialize(weight, recurrent_weight, bias)
  @weight, @recurrent_weight, @bias = weight, recurrent_weight, bias
  # Two tanh activations: one for the candidate gate, one for the cell output.
  @tanh = Layers::Tanh.new
  @g_tanh = Layers::Tanh.new
  # One sigmoid per gating unit, each caching its own forward state.
  @forget_sigmoid, @in_sigmoid, @out_sigmoid = Array.new(3) { Layers::Sigmoid.new }
  # Gradients are accumulated into the parameters unless this is cleared.
  @trainable = true
end

Instance Attribute Details

#trainable ⇒ Object

Returns the value of attribute trainable.



224
225
226
# File 'lib/dnn/core/rnn_layers.rb', line 224

# Whether this cell accumulates parameter gradients in #backward.
# Initialized to true in #initialize.  NOTE(review): presumably toggled
# externally when freezing a layer — confirm against callers.
def trainable
  @trainable
end

Instance Method Details

#backward(dh2, dc2) ⇒ Object



257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
# File 'lib/dnn/core/rnn_layers.rb', line 257

# Backpropagates one step through the cell.
#
# dh2 - gradient flowing into the emitted hidden state h2.
# dc2 - gradient flowing into the emitted cell state c2.
#
# Accumulates into @weight.grad / @recurrent_weight.grad / @bias.grad
# when @trainable, and returns [dx, dh, dc]: the gradients for the
# input, previous hidden state, and previous cell state.
def backward(dh2, dc2)
  # Gradient reaching the output gate activation, and the total
  # gradient on the cell state (through tanh plus the direct path).
  d_out_act = dh2 * @tanh_c2
  d_cell = @tanh.backward(dh2 * @out) + dc2

  # Pre-activation gradients for each gate (independent of each other).
  dout = @out_sigmoid.backward(d_out_act)
  dforget = @forget_sigmoid.backward(d_cell * @c)
  dg = @g_tanh.backward(d_cell * @in)
  din = @in_sigmoid.backward(d_cell * @g)

  # Column order must mirror forward's slicing: forget | g | in | out.
  da = Xumo::SFloat.hstack([dforget, dg, din, dout])

  if @trainable
    @weight.grad += @x.transpose.dot(da)
    @recurrent_weight.grad += @h.transpose.dot(da)
    @bias.grad += da.sum(0) if @bias
  end

  [da.dot(@weight.data.transpose),
   da.dot(@recurrent_weight.data.transpose),
   d_cell * @forget]
end

#forward(x, h, c) ⇒ Object



238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
# File 'lib/dnn/core/rnn_layers.rb', line 238

# Runs one LSTM step.
#
# x - input batch, shape (batch, input_dim).
# h - previous hidden state, shape (batch, num_nodes).
# c - previous cell state, same shape as h.
#
# Caches x, h, c and the gate activations for #backward, and returns
# [h2, c2]: the new hidden and cell states.
def forward(x, h, c)
  @x = x
  @h = h
  @c = c
  n = h.shape[1]

  # Single fused projection; its 4n columns hold all four gates.
  a = x.dot(@weight.data) + h.dot(@recurrent_weight.data)
  a += @bias.data if @bias

  # Slice out each gate block: forget | g (candidate) | in | out.
  ranges = [0...n, n...(n * 2), (n * 2)...(n * 3), (n * 3)..-1]
  f_a, g_a, i_a, o_a = ranges.map { |r| a[true, r] }
  @forget = @forget_sigmoid.forward(f_a)
  @g = @g_tanh.forward(g_a)
  @in = @in_sigmoid.forward(i_a)
  @out = @out_sigmoid.forward(o_a)

  c2 = @forget * c + @g * @in
  @tanh_c2 = @tanh.forward(c2)
  h2 = @out * @tanh_c2
  [h2, c2]
end