Class: DNN::Layers::GRUDense

Inherits:

Layer

Object
Layer
DNN::Layers::GRUDense

show all

Defined in:: lib/dnn/core/layers/rnn_layers.rb

Instance Attribute Summary collapse

#trainable ⇒ Object

Returns the value of attribute trainable.

Attributes inherited from Layer

#input_shape, #output_shape

Instance Method Summary collapse

#backward(dh2) ⇒ Object
#forward(x, h) ⇒ Object
#initialize(weight, recurrent_weight, bias) ⇒ GRUDense constructor

A new instance of GRUDense.

Methods inherited from Layer

#<<, #build, #built?, #call, call, #clean, #compute_output_shape, from_hash, #load_hash, #to_hash

Constructor Details

#initialize(weight, recurrent_weight, bias) ⇒ `GRUDense`

Returns a new instance of GRUDense.

# File 'lib/dnn/core/layers/rnn_layers.rb', line 371

def initialize(weight, recurrent_weight, bias)
  @weight = weight
  @recurrent_weight = recurrent_weight
  @bias = bias
  @update_sigmoid = Layers::Sigmoid.new
  @reset_sigmoid = Layers::Sigmoid.new
  @tanh = Layers::Tanh.new
  @trainable = true
end

Instance Attribute Details

#trainable ⇒ `Object`

Returns the value of attribute trainable.



369
370
371

# File 'lib/dnn/core/layers/rnn_layers.rb', line 369

def trainable
  @trainable
end

Instance Method Details

#backward(dh2) ⇒ `Object`

# File 'lib/dnn/core/layers/rnn_layers.rb', line 404

def backward(dh2)
  dtanh_h = @tanh.backward_node(dh2 * (1 - @update))
  dh = dh2 * @update

  if @trainable
    dweight_h = @x.transpose.dot(dtanh_h)
    dweight2_h = (@h * @reset).transpose.dot(dtanh_h)
    dbias_h = dtanh_h.sum(0) if @bias
  end
  dx = dtanh_h.dot(@weight_h.transpose)
  dh += dtanh_h.dot(@weight2_h.transpose) * @reset

  dreset = @reset_sigmoid.backward_node(dtanh_h.dot(@weight2_h.transpose) * @h)
  dupdate = @update_sigmoid.backward_node(dh2 * @h - dh2 * @tanh_h)
  da = Xumo::SFloat.hstack([dupdate, dreset])
  if @trainable
    dweight_a = @x.transpose.dot(da)
    dweight2_a = @h.transpose.dot(da)
    dbias_a = da.sum(0) if @bias
  end
  dx += da.dot(@weight_a.transpose)
  dh += da.dot(@weight2_a.transpose)

  if @trainable
    @weight.grad += Xumo::SFloat.hstack([dweight_a, dweight_h])
    @recurrent_weight.grad += Xumo::SFloat.hstack([dweight2_a, dweight2_h])
    @bias.grad += Xumo::SFloat.hstack([dbias_a, dbias_h]) if @bias
  end
  [dx, dh]
end

#forward(x, h) ⇒ `Object`

# File 'lib/dnn/core/layers/rnn_layers.rb', line 381

def forward(x, h)
  @x = x
  @h = h
  num_units = h.shape[1]
  @weight_a = @weight.data[true, 0...(num_units * 2)]
  @weight2_a = @recurrent_weight.data[true, 0...(num_units * 2)]
  a = x.dot(@weight_a) + h.dot(@weight2_a)
  a += @bias.data[0...(num_units * 2)] if @bias
  @update = @update_sigmoid.forward_node(a[true, 0...num_units])
  @reset = @reset_sigmoid.forward_node(a[true, num_units..-1])

  @weight_h = @weight.data[true, (num_units * 2)..-1]
  @weight2_h = @recurrent_weight.data[true, (num_units * 2)..-1]
  @tanh_h = if @bias
              bias_h = @bias.data[(num_units * 2)..-1]
              @tanh.forward_node(x.dot(@weight_h) + (h * @reset).dot(@weight2_h) + bias_h)
            else
              @tanh.forward_node(x.dot(@weight_h) + (h * @reset).dot(@weight2_h))
            end
  h2 = (1 - @update) * @tanh_h + @update * h
  h2
end

Class: DNN::Layers::GRUDense

Instance Attribute Summary collapse

Attributes inherited from Layer

Instance Method Summary collapse

Methods inherited from Layer

Constructor Details

#initialize(weight, recurrent_weight, bias) ⇒ GRUDense

Instance Attribute Details

#trainable ⇒ Object

Instance Method Details

#backward(dh2) ⇒ Object

#forward(x, h) ⇒ Object

#initialize(weight, recurrent_weight, bias) ⇒ `GRUDense`

#trainable ⇒ `Object`

#backward(dh2) ⇒ `Object`

#forward(x, h) ⇒ `Object`