Class: Tensorflow::TensorData

Inherits:

Object

Object
Tensorflow::TensorData

show all

Extended by:: FFI::Library, Forwardable

Defined in:: lib/tensorflow/tensor_data.rb

Overview

Tensorflow expects client libraries to allocate memory for the data that a tensor wraps. When a tensor is released, it notifies the client via a callback that gives the client a chance to release the memory.

We don’t want to use a FFI::MemoryPointer because they are garbage collected. If the underlying data is freed before the tensor is released you get a GC (this can happen even if a Ruby tensor object keeps a reference to the pointer at GC time).

Thus this class creates its own memory and frees the memory only after being called bcak by tensorflow.

Constant Summary collapse

Deallocator = Store a callback as a class consstant (so it won’t be garbage collected ) that tensorflow will trigger when memory should be freed.

::FFI::Function.new(:void, [:pointer, :size_t, :pointer]) do |data, len, arg|
  ruby_xfree(data)
end

DTYPE_TO_NUMO_TYPE_MAP =

{bool:       Numo::Bit,
complex64:  Numo::SComplex,
complex128: Numo::DComplex,
double:     Numo::DFloat,
float:      Numo::SFloat,
int8:       Numo::Int8,
int16:      Numo::Int16,
int32:      Numo::Int32,
int64:      Numo::Int64,
uint8:      Numo::UInt8,
uint16:     Numo::UInt16,
uint32:     Numo::UInt32,
uint64:     Numo::UInt64}

NUMO_TYPE_TO_DTYPE_MAP =

DTYPE_TO_NUMO_TYPE_MAP.each_with_object(Hash.new) do |pair, hash|
  hash[pair.last] = pair.first
end

Instance Attribute Summary collapse

#byte_size ⇒ Object readonly

Returns the value of attribute byte_size.
#dtype ⇒ Object readonly

Returns the value of attribute dtype.
#pointer ⇒ Object readonly

Returns the value of attribute pointer.
#shape ⇒ Object readonly

Returns the value of attribute shape.

Class Method Summary collapse

Instance Method Summary collapse

#initialize(value, dtype: nil, shape: []) ⇒ TensorData constructor

A new instance of TensorData.
#read_array_of_complex128(count) ⇒ Object
#read_array_of_complex64(count) ⇒ Object
#read_array_of_string(count) ⇒ Object
#to_ptr ⇒ Object
#value ⇒ Object

def value result = case self.dtype when :float, :double, :int32, :uint8, :int16, :int8, :int64, :uint16, :uint32, :uint64 self.pointer.send(“read_array_of_#selfself.dtype”, self.count) when :bfloat16 byte_str = self.pointer.read_bytes(self.count * 2) self.count.times.map { |i| “#* i)..(2 * i + 1)]x00x00”.unpack1(“g”) } when :complex64 self.read_array_of_complex64(self.count) when :complex128 self.read_array_of_complex128(self.count) when :string self.read_array_of_string(self.count) when :bool self.pointer.read_array_of_int8(self.count) when :resource, :variant return self.data else raise “Unsupported tensor data type: #selfself.dtype” end.
#write_array_of_string(strings) ⇒ Object
#write_narray(new_value) ⇒ Object
#write_scalar(new_value) ⇒ Object

Constructor Details

#initialize(value, dtype: nil, shape: []) ⇒ `TensorData`

Returns a new instance of TensorData.

# File 'lib/tensorflow/tensor_data.rb', line 113

def initialize(value, dtype: nil, shape: [])
  @dtype = dtype || self.class.figure_dtype(value)
  @shape = shape
  case value
    when Numo::NArray
      self.write_narray(value)
    when Array
      raise(Error::InvalidArgumentError, "TensorData does not support Arrays. Please use a Numo::NArray")
    when Google::Protobuf::MessageExts
      encoded = value.class.encode(value)
      self.write_array_of_string([encoded])
    else
      self.write_scalar(value)
  end
end

Instance Attribute Details

#byte_size ⇒ `Object` (readonly)

Returns the value of attribute byte_size.



18
19
20

# File 'lib/tensorflow/tensor_data.rb', line 18

def byte_size
  @byte_size
end

#dtype ⇒ `Object` (readonly)

Returns the value of attribute dtype.



18
19
20

# File 'lib/tensorflow/tensor_data.rb', line 18

def dtype
  @dtype
end

#pointer ⇒ `Object` (readonly)

Returns the value of attribute pointer.



18
19
20

# File 'lib/tensorflow/tensor_data.rb', line 18

def pointer
  @pointer
end

#shape ⇒ `Object` (readonly)

Returns the value of attribute shape.



18
19
20

# File 'lib/tensorflow/tensor_data.rb', line 18

def shape
  @shape
end

Class Method Details

.figure_dtype(value) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 47

def self.figure_dtype(value)
  case value
    when Numo::RObject
      # Need to look at the first element to see what it is
      self.figure_dtype(value[0])
    when Numo::NArray
      NUMO_TYPE_TO_DTYPE_MAP[value.class]
    when Array
      self.figure_dtype(value.first)
    when Integer
      (value >= -2147483648 && value <= 2147483647) ? :int32 : :int64
    when Complex
      (value.real > -1.175494351e38 && value.real <	3.402823466e38) ? :complex64 : :complex128
    when Numeric
      (value > -1.175494351e38 && value <	3.402823466e38) ? :float : :double
    when String
      :string
    when TrueClass, FalseClass
      :bool
    when ::FFI::Pointer
      :pointer
    when Tensor
      value.dtype
    when Variable
      value.dtype
    when Graph::Operation
      nil
    when Eager::TensorHandle
      value.dtype
    when Google::Protobuf::MessageExts
      :string
    else
      raise(Error::InvalidArgumentError, "Unsupported type: #{value.class}")
  end
end

.from_pointer(pointer, byte_size, dtype, shape) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 104

def self.from_pointer(pointer, byte_size, dtype, shape)
  result = self.allocate
  result.instance_variable_set(:@pointer, pointer)
  result.instance_variable_set(:@byte_size, byte_size)
  result.instance_variable_set(:@dtype, dtype)
  result.instance_variable_set(:@shape, shape)
  result
end

.type_size(dtype) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 83

def self.type_size(dtype)
  case dtype
    when :complex64
      ::FFI.type_size(:float) * 2
    when :complex128
      ::FFI.type_size(:double) * 2
    else
      ::FFI.type_size(dtype)
  end
end

.value_with_shape(value, dtype, shape) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 94

def self.value_with_shape(value, dtype, shape)
  if shape && shape.size > 0
    dtype ||= self.figure_dtype(value)
    numo_klass = DTYPE_TO_NUMO_TYPE_MAP[dtype]
    numo_klass.new(shape).fill(value)
  else
    value
  end
end

Instance Method Details

#read_array_of_complex128(count) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 140

def read_array_of_complex128(count)
  values = self.read_array_of_double(2 * count)
  values.each_slice(2).map do |real, imaginary|
    Complex(real, imaginary)
  end
end

#read_array_of_complex64(count) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 133

def read_array_of_complex64(count)
  values = self.read_array_of_float(2 * count)
  values.each_slice(2).map do |real, imaginary|
    Complex(real, imaginary)
  end
end

#read_array_of_string(count) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 147

def read_array_of_string(count)
  # The start of the data section comes after the offset table
  start_offset_size = count * ::FFI.type_size(:int64)

  # Read in the string offsets
  offsets = self.pointer.read_array_of_uint64(count)

  offsets.map.with_index do |offset, index|
    src_bytes = (offsets[index + 1] || self.byte_size) - offset
    dst_ptr = ::FFI::MemoryPointer.new(:pointer)
    dst_len_ptr = ::FFI::MemoryPointer.new(:size_t)
    Status.check do |status|
      FFI.TF_StringDecode(self.pointer + start_offset_size + offset, src_bytes, dst_ptr, dst_len_ptr, status)
    end
    string_pointer = dst_ptr.read_pointer
    string_length = dst_len_ptr.read(:size_t)
    string_pointer.read_string(string_length)
  end
end

#to_ptr ⇒ `Object`



129
130
131

# File 'lib/tensorflow/tensor_data.rb', line 129

def to_ptr
  @pointer
end

#value ⇒ `Object`

def value

result = case self.dtype
          when :float, :double, :int32, :uint8, :int16, :int8, :int64, :uint16, :uint32, :uint64
            self.pointer.send("read_array_of_#{self.dtype}", self.count)
          when :bfloat16
            byte_str = self.pointer.read_bytes(self.count * 2)
            self.count.times.map { |i| "#{byte_str[(2 * i)..(2 * i + 1)]}\x00\x00".unpack1("g") }
          when :complex64
            self.read_array_of_complex64(self.count)
          when :complex128
            self.read_array_of_complex128(self.count)
          when :string
            self.read_array_of_string(self.count)
          when :bool
            self.pointer.read_array_of_int8(self.count)
          when :resource, :variant
            return self.data
          else
            raise "Unsupported tensor data type: #{self.dtype}"
        end

if self.count == 1
  result.first
else
  result
end

end

# File 'lib/tensorflow/tensor_data.rb', line 195

def value
  result = case self.dtype
             when :bfloat16
               byte_str = self.pointer.read_bytes(self.count * 2)
               self.count.times.map { |i| "#{byte_str[(2 * i)..(2 * i + 1)]}\x00\x00".unpack1("g") }
             when :string
               count = self.shape.reduce(1) {|dim, result| result *= dim}
               self.read_array_of_string(count)
             when :bool
               bytes = self.pointer.read_bytes(self.byte_size)
               int8 = if self.shape.empty?
                         Numo::Int8.from_binary(bytes)
                       else
                         Numo::Int8.from_binary(bytes, self.shape)
                       end
               int8.cast_to(Numo::Bit)
             else
               bytes = self.pointer.read_bytes(self.byte_size)
               numo_klass = DTYPE_TO_NUMO_TYPE_MAP[self.dtype]
               if self.shape.empty?
                 numo_klass.from_binary(bytes)
               else
                 numo_klass.from_binary(bytes, self.shape)
               end
           end

  if self.shape.empty?
    result[0]
  else
    result
  end
end

#write_array_of_string(strings) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 228

def write_array_of_string(strings)
  # The start of the data section comes after the offset table
  start_offset_size = strings.size * ::FFI.type_size(:int64)

  # Get the encoded sizes for each string
  encoded_sizes = strings.map do |string|
    FFI.TF_StringEncodedSize(string.bytesize)
  end

  # Now figure the offsets. Offsets are relative to the beginning of data section, not the beginning of the pointer.
  # Notice we skip the last string [0..-2] since its offset would be the end of the pointer
  offsets = [0]
  encoded_sizes[0..-2].each do |encoded_size|
    offsets << offsets.last + encoded_size
  end

  # Allocate the needed memory
  @byte_size = start_offset_size + encoded_sizes.sum
  @pointer = self.class.ruby_xmalloc(@byte_size)

  # Write the offsets
  self.pointer.write_array_of_uint64(offsets)

  # Write the strings
  strings.each_with_index do |string, index|
    offset = offsets[index]
    size = encoded_sizes[index]
    Status.check do |status|
      FFI.TF_StringEncode(string, string.bytesize, self.pointer + start_offset_size + offset, size, status)
    end
  end
end

#write_narray(new_value) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 261

def write_narray(new_value)
  @shape = new_value.shape

  case self.dtype
    when :string
      self.write_array_of_string(new_value.flatten.to_a)
    when :bool
      new_value = new_value.cast_to(Numo::Int8)
      @byte_size = new_value.byte_size
      @pointer = self.class.ruby_xmalloc(self.byte_size)
      self.pointer.write_bytes(new_value.to_binary)
    else
      if NUMO_TYPE_TO_DTYPE_MAP[new_value.class] != dtype
        # Cast the narray if necessary (say the user passed in float but we have a double array)
        new_value = new_value.cast_to(DTYPE_TO_NUMO_TYPE_MAP[dtype])
      end
      @byte_size = new_value.byte_size
      @pointer = self.class.ruby_xmalloc(@byte_size)
      self.pointer.write_bytes(new_value.to_binary)
  end
end

#write_scalar(new_value) ⇒ `Object`

# File 'lib/tensorflow/tensor_data.rb', line 283

def write_scalar(new_value)
  case self.dtype
    when :string
      self.write_array_of_string([new_value])
    when :resource, :variant
      return self
    else
      @byte_size = self.class.type_size(self.dtype)
      @pointer = self.class.ruby_xmalloc(@byte_size)
      case self.dtype
        when :float, :double, :int32, :uint8, :int16, :int8, :int64, :uint16, :uint32, :uint64
          self.pointer.send("write_#{self.dtype}", new_value)
        when :bfloat16
          byte_str = self.pointer.read_bytes(self.count * 2)
          self.count.times.map { |i| "#{byte_str[(2 * i)..(2 * i + 1)]}\x00\x00".unpack1("g") }
        when :complex64
          self.pointer.write_array_of_float([new_value.real, new_value.imaginary])
        when :complex128
          self.pointer.write_array_of_double([new_value.real, new_value.imaginary])
        when :bool
          self.pointer.write_int8(new_value ? 1 : 0)
        else
          raise "Unsupported tensor data type: #{self.dtype}"
      end
  end
end

Class: Tensorflow::TensorData

Overview

Constant Summary collapse

Instance Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(value, dtype: nil, shape: []) ⇒ TensorData

Instance Attribute Details

#byte_size ⇒ Object (readonly)

#dtype ⇒ Object (readonly)

#pointer ⇒ Object (readonly)

#shape ⇒ Object (readonly)

Class Method Details

.figure_dtype(value) ⇒ Object

.from_pointer(pointer, byte_size, dtype, shape) ⇒ Object

.type_size(dtype) ⇒ Object

.value_with_shape(value, dtype, shape) ⇒ Object

Instance Method Details

#read_array_of_complex128(count) ⇒ Object

#read_array_of_complex64(count) ⇒ Object

#read_array_of_string(count) ⇒ Object

#to_ptr ⇒ Object

#value ⇒ Object

#write_array_of_string(strings) ⇒ Object

#write_narray(new_value) ⇒ Object

#write_scalar(new_value) ⇒ Object