Class: OdpsDatahub::Serializer
- Inherits:
- Object
- Object
- OdpsDatahub::Serializer
- Defined in:
- lib/fluent/plugin/serialize/serializer.rb
Instance Method Summary
- #encodeBool(value) ⇒ Object
- #encodeDataTime(value) ⇒ Object
- #encodeDouble(value) ⇒ Object
- #encodeFixed32(value) ⇒ Object
- #encodeFixed64(value) ⇒ Object
- #encodeFixedString(value) ⇒ Object
- #encodeSInt64(value) ⇒ Object
- #encodeString(value) ⇒ Object
- #encodeUInt32(value) ⇒ Object
- #serialize(upStream, recordList) ⇒ Object
- #writeTag(idx, type, stream) ⇒ Object
Instance Method Details
#encodeBool(value) ⇒ Object
32 33 34 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 32
# Encodes a boolean as a single unsigned byte.
#
# @param value [Object] judged by Ruby truthiness (only nil/false are falsy)
# @return [String] one-byte string: 1 when value is truthy, 0 otherwise
def encodeBool(value)
  flag = value ? 1 : 0
  [flag].pack('C')
end
#encodeDataTime(value) ⇒ Object
59 60 61 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 59
# Encodes a datetime value by delegating to #encodeSInt64.
#
# @param value [Integer] value handed unchanged to #encodeSInt64
#   (presumably an integral timestamp; units are not visible here)
# @return [Object] whatever #encodeSInt64 returns
def encodeDataTime(value)
  encodeSInt64(value)
end
#encodeDouble(value) ⇒ Object
36 37 38 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 36
# Encodes a number as an 8-byte little-endian double-precision float.
#
# @param value [Numeric] number to encode
# @return [String] 8-byte packed representation
def encodeDouble(value)
  le_double = [value].pack('E')
  le_double
end
#encodeFixed32(value) ⇒ Object
76 77 78 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 76
# Encodes an integer as a 4-byte little-endian unsigned value.
#
# @param value [Integer] integer to encode
# @return [String] 4-byte packed representation
def encodeFixed32(value)
  le_word = [value].pack('V')
  le_word
end
#encodeFixed64(value) ⇒ Object
71 72 73 74 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 71
# Encodes an integer as 8 bytes, little-endian, by packing its low and high
# 32-bit halves separately.
#
# @param value [Integer] integer to encode
# @return [String] 8-byte packed representation (low word first)
def encodeFixed64(value)
  # The 'Q' pack directive is deliberately avoided: the original author
  # notes it is machine-dependent, so two 'V' words are emitted instead.
  low_word = value & 0xffff_ffff
  high_word = value >> 32
  [low_word, high_word].pack('VV')
end
#encodeFixedString(value) ⇒ Object
80 81 82 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 80
# Packs value as a 4-byte little-endian unsigned integer.
#
# NOTE(review): despite the name, the body performs the same 32-bit integer
# pack as #encodeFixed32 and does no string handling — confirm the intent.
#
# @param value [Integer] integer to encode
# @return [String] 4-byte packed representation
def encodeFixedString(value)
  packed = [value].pack('V')
  packed
end
#encodeSInt64(value) ⇒ Object
40 41 42 43 44 45 46 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 40
# Encodes a signed integer as a varint after mapping it to a non-negative
# number: non-negative n becomes 2n, negative n becomes ~(2n) (i.e. -2n - 1).
#
# @param value [Integer] signed integer to encode
# @return [Object] result of ::Protobuf::Field::VarintField.encode
def encodeSInt64(value)
  doubled = value << 1
  mapped = value >= 0 ? doubled : ~doubled
  ::Protobuf::Field::VarintField.encode(mapped)
end
#encodeString(value) ⇒ Object
63 64 65 66 67 68 69 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 63
# Encodes a string as a varint length prefix followed by the string's bytes.
#
# The input is copied first, so the caller's string is never mutated. The
# copy is transcoded to ::Protobuf::Field::StringField::ENCODING (invalid or
# undefined characters are dropped) and then re-tagged with
# ::Protobuf::Field::BytesField::BYTES_ENCODING before its size is taken.
#
# @param value [String] text to encode
# @return [String] varint-encoded size followed by the payload
def encodeString(value)
  payload = value.dup
  payload.encode!(
    ::Protobuf::Field::StringField::ENCODING,
    invalid: :replace,
    undef: :replace,
    replace: ""
  )
  payload.force_encoding(::Protobuf::Field::BytesField::BYTES_ENCODING)

  length_prefix = ::Protobuf::Field::VarintField.encode(payload.size)
  length_prefix << payload
end
#encodeUInt32(value) ⇒ Object
48 49 50 51 52 53 54 55 56 57 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 48
# Encodes a non-negative integer as a base-128 varint: seven payload bits per
# byte, least-significant group first, with the high bit set on every byte
# except the last.
#
# @param value [Integer] non-negative integer to encode
# @return [String] the varint bytes
# @raise [ArgumentError] if value is negative. Previously a negative value
#   fell into the single-byte shortcut and was emitted as one truncated byte
#   (e.g. -1 became 0xFF), which is not a valid varint.
def encodeUInt32(value)
  if value < 0
    raise ArgumentError, "encodeUInt32 expects a non-negative integer, got #{value}"
  end

  # Values that fit in seven bits are a single byte with no continuation bit.
  return [value].pack('C') if value < 128

  bytes = []
  until value == 0
    bytes << (0x80 | (value & 0x7f))
    value >>= 7
  end
  # The final group terminates the varint, so clear its continuation bit.
  bytes[-1] &= 0x7f
  bytes.pack('C*')
end
#serialize(upStream, recordList) ⇒ Object
89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 89
# Serializes a list of records onto upStream.
#
# For every record, each non-nil column is written to upStream as a tagged
# field whose field number is the column index plus one. In parallel, the
# field number and the raw value are appended to a per-record buffer that is
# fed to CrcCalculator. After the columns, the $TUNNEL_END_RECORD tag and the
# record checksum are written. Once all records are done, the record count
# ($TUNNEL_META_COUNT) and a checksum computed over the per-record checksums
# ($TUNNEL_META_CHECKSUM) are written.
#
# @param upStream [#write, #<<] destination stream for the encoded bytes
# @param recordList [Array] records responding to getTableSchema and getValue
# @return [Object] the result of the final upStream.write call
# @raise [OdpsDatahubException] if recordList is not an Array, or a column
#   has a type other than the $ODPS_* types handled below
def serialize(upStream, recordList)
  unless recordList.is_a?(Array)
    raise OdpsDatahubException.new($INVALID_ARGUMENT, "param must be a array")
  end

  crc32cPack = StringIO.new
  recordList.each do |record|
    crc32cRecord = StringIO.new
    schema = record.getTableSchema
    schema.mCols.each do |col|
      cellValue = record.getValue(col.mIdx)
      # Nil cells are omitted from both the stream and the checksum input.
      next if cellValue.nil?

      fieldNumber = col.mIdx + 1
      crc32cRecord.write(encodeFixed32(fieldNumber))
      case col.mType
      when $ODPS_BIGINT
        crc32cRecord.write(encodeFixed64(cellValue))
        writeTag(fieldNumber, ::Protobuf::WireType::VARINT, upStream)
        upStream.write(encodeSInt64(cellValue))
      when $ODPS_DOUBLE
        crc32cRecord.write(encodeDouble(cellValue))
        writeTag(fieldNumber, ::Protobuf::WireType::FIXED64, upStream)
        upStream.write(encodeDouble(cellValue))
      when $ODPS_BOOLEAN
        crc32cRecord.write(encodeBool(cellValue))
        writeTag(fieldNumber, ::Protobuf::WireType::VARINT, upStream)
        upStream.write(encodeBool(cellValue))
      when $ODPS_DATETIME
        crc32cRecord.write(encodeFixed64(cellValue))
        writeTag(fieldNumber, ::Protobuf::WireType::VARINT, upStream)
        upStream.write(encodeDataTime(cellValue))
      when $ODPS_STRING, $ODPS_DECIMAL
        # Strings and decimals share one wire form: the raw value feeds the
        # checksum and the length-prefixed string goes on the stream.
        crc32cRecord.write(cellValue)
        writeTag(fieldNumber, ::Protobuf::WireType::LENGTH_DELIMITED, upStream)
        upStream.write(encodeString(cellValue))
      else
        raise OdpsDatahubException.new($INVALID_ARGUMENT, "invalid mType")
      end
    end

    recordCrc = CrcCalculator::calculate(crc32cRecord)
    writeTag($TUNNEL_END_RECORD, ::Protobuf::WireType::VARINT, upStream)
    upStream.write(encodeUInt32(recordCrc))
    crc32cPack.write(encodeFixed32(recordCrc))
  end

  writeTag($TUNNEL_META_COUNT, ::Protobuf::WireType::VARINT, upStream)
  upStream.write(encodeSInt64(recordList.size))
  writeTag($TUNNEL_META_CHECKSUM, ::Protobuf::WireType::VARINT, upStream)
  upStream.write(encodeUInt32(CrcCalculator::calculate(crc32cPack)))
end
#writeTag(idx, type, stream) ⇒ Object
84 85 86 87 |
# File 'lib/fluent/plugin/serialize/serializer.rb', line 84
# Appends a field tag to stream. The tag is the field index shifted left by
# three bits, OR-ed with the wire type, then varint-encoded.
#
# @param idx [Integer] field index
# @param type [Integer] wire type, stored in the low three bits
# @param stream [#<<] destination the encoded tag is appended to
# @return [Object] the result of stream << encoded tag
def writeTag(idx, type, stream)
  tag = (idx << 3) | type
  encoded_tag = ::Protobuf::Field::VarintField.encode(tag)
  stream << encoded_tag
end