Module: VibeZstd

Defined in: lib/vibe_zstd.rb,
lib/vibe_zstd/version.rb,
lib/vibe_zstd/constants.rb,
ext/vibe_zstd/vibe_zstd.c

Defined Under Namespace

Modules: DictAttachPref, Format, LiteralCompressionMode, ResetDirective, Strategy, ThreadLocal

Classes: CCtx, CDict, CompressWriter, DCtx, DDict, DecompressReader, Error

Constant Summary collapse

VERSION =

"1.0.1"

Class Method Summary collapse

.compress(data, **options) ⇒ Object

Convenience method for one-off compression. Supports all CCtx#compress options: level, dict, pledged_size.
.compress_bound(size) ⇒ Object

VibeZstd.compress_bound(size).
.decompress(data, **options) ⇒ Object

Convenience method for one-off decompression. Supports all DCtx#decompress options: dict, initial_capacity.
.default_compression_level ⇒ Object (also: default_level)
.dict_header_size(dict_data) ⇒ Object

VibeZstd.dict_header_size(dict_data).
.each_skippable_frame(data) ⇒ Object

Iterate over all skippable frames in the data. Yields [content, magic_variant, offset] for each skippable frame.
.finalize_dictionary(*args) ⇒ Object

For large datasets, consider using a representative subset of samples.
.find_frame_compressed_size(data) ⇒ Object
.frame_content_size(data) ⇒ Object

Get the decompressed content size from a compressed frame. Returns nil if the size is unknown or the data is invalid.
.get_dict_id(dict_data) ⇒ Object

VibeZstd.get_dict_id(dict_data).
.get_dict_id_from_frame(data) ⇒ Object

VibeZstd.get_dict_id_from_frame(data).
.max_compression_level ⇒ Object (also: max_level)
.min_compression_level ⇒ Object (also: min_level)
.read_skippable_frame(data) ⇒ Object
.skippable_frame?(data) ⇒ Boolean
.train_dict(*args) ⇒ Object

For large datasets, consider training on a representative subset to reduce memory footprint.
.train_dict_cover(*args) ⇒ Object

For large datasets, consider training on a representative subset to reduce memory footprint.
.train_dict_fast_cover(*args) ⇒ Object

For large datasets, consider training on a representative subset to reduce memory footprint.
.version_number ⇒ Object

Module-level version and compression level functions.
.version_string ⇒ Object
.write_skippable_frame(*args) ⇒ Object

Class Method Details

.compress(data, **options) ⇒ `Object`

Convenience method for one-off compression. Supports all CCtx#compress options: level, dict, pledged_size.

# File 'lib/vibe_zstd.rb', line 12

# One-shot compression helper: creates a throwaway CCtx and delegates to it.
#
# @param data the payload handed to CCtx#compress
# @param options keyword options forwarded unchanged to CCtx#compress
#   (documented as level, dict, pledged_size)
# @return whatever CCtx#compress returns
def self.compress(data, **options)
  CCtx.new.compress(data, **options)
end

.compress_bound(size) ⇒ `Object`

VibeZstd.compress_bound(size)

# File 'ext/vibe_zstd/frames.c', line 5

// VibeZstd.compress_bound(size)
//
// Converts `size` to a size_t and returns ZSTD_compressBound() for it as a Ruby Integer.
// Raises RuntimeError when zstd answers with an error code instead of a bound.
static VALUE
vibe_zstd_compress_bound(VALUE self, VALUE size) {
    (void)self;
    size_t src_size = NUM2SIZET(size);
    size_t bound = ZSTD_compressBound(src_size);

    // ZSTD_compressBound() reports "input too large" through an error code. Without this
    // check that code would be handed back to Ruby as if it were a (huge) byte count.
    if (ZSTD_isError(bound)) {
        rb_raise(rb_eRuntimeError, "Failed to compute compress bound: %s", ZSTD_getErrorName(bound));
    }

    return SIZET2NUM(bound);
}

.decompress(data, **options) ⇒ `Object`

Convenience method for one-off decompression. Supports all DCtx#decompress options: dict, initial_capacity.

# File 'lib/vibe_zstd.rb', line 19

# One-shot decompression helper: creates a throwaway DCtx and delegates to it.
#
# @param data the payload handed to DCtx#decompress
# @param options keyword options forwarded unchanged to DCtx#decompress
#   (documented as dict, initial_capacity)
# @return whatever DCtx#decompress returns
def self.decompress(data, **options)
  DCtx.new.decompress(data, **options)
end

.default_compression_level ⇒ `Object` Also known as: default_level

# File 'ext/vibe_zstd/vibe_zstd.c', line 243

// Returns ZSTD_defaultCLevel() as a Ruby Integer; the receiver is not used.
static VALUE
vibe_zstd_default_c_level(VALUE self) {
    const int level = ZSTD_defaultCLevel();

    (void)self;
    return INT2NUM(level);
}

.dict_header_size(dict_data) ⇒ `Object`

VibeZstd.dict_header_size(dict_data)

# File 'ext/vibe_zstd/dict.c', line 529

// VibeZstd.dict_header_size(dict_data)
//
// Returns ZDICT_getDictHeaderSize() for the given dictionary bytes as a Ruby Integer.
// Raises TypeError (via StringValue) when dict_data cannot be used as a String and
// RuntimeError when zdict reports an error.
static VALUE
vibe_zstd_dict_header_size(VALUE self, VALUE dict_data) {
    StringValue(dict_data);

    const char* dict_ptr = RSTRING_PTR(dict_data);
    size_t dict_len = RSTRING_LEN(dict_data);
    size_t result = ZDICT_getDictHeaderSize(dict_ptr, dict_len);

    // zdict encodes failures in the returned size_t
    if (ZDICT_isError(result)) {
        rb_raise(rb_eRuntimeError, "Failed to get dictionary header size: %s", ZDICT_getErrorName(result));
    }

    return SIZET2NUM(result);
}

.each_skippable_frame(data) ⇒ `Object`

Iterate over all skippable frames in the data. Yields [content, magic_variant, offset] for each skippable frame.

# File 'lib/vibe_zstd.rb', line 32

# Walks the back-to-back frames in +data+ and yields every skippable one.
#
# Called without a block, returns an Enumerator over the same sequence.
#
# @param data [String] buffer holding concatenated frames
# @yield [content, magic_variant, offset] the two values returned by
#   read_skippable_frame, followed by the byte offset at which the frame starts
# @raise [Error] when a frame reports a size of zero or less
def self.each_skippable_frame(data)
  return enum_for(:each_skippable_frame, data) unless block_given?

  position = 0
  until position >= data.bytesize
    remainder = data.byteslice(position..-1)
    consumed = find_frame_compressed_size(remainder)

    # A frame that consumes nothing would never advance the cursor, so stop
    # here rather than loop forever on malformed input.
    raise Error, "Invalid frame: zero or negative size at offset #{position}" if consumed <= 0

    if skippable_frame?(remainder)
      payload, variant = read_skippable_frame(remainder)
      yield payload, variant, position
    end

    position += consumed
  end
end

.finalize_dictionary(*args) ⇒ `Object`

For large datasets, consider using a representative subset of samples.

# File 'ext/vibe_zstd/dict.c', line 433

// Builds a finished zstd dictionary from raw content with ZDICT_finalizeDictionary().
//
// Keyword arguments (all read from the options hash):
//   content:           String, required - raw dictionary content
//   samples:           non-empty Array of Strings, required
//   max_size:          Integer, required - capacity of the output buffer in bytes
//   compression_level: Integer, optional (0 when omitted)
//   dict_id:           Integer, optional (0 when omitted)
//
// Returns the finalized dictionary as a new String.
// Raises ArgumentError for missing keywords, an empty samples array or a sample count that
// does not fit in `unsigned`; TypeError for wrongly typed arguments; RuntimeError when
// ZDICT_finalizeDictionary() reports an error.
static VALUE
vibe_zstd_finalize_dictionary(int argc, VALUE* argv, VALUE self) {
    (void)self;
    VALUE options;
    rb_scan_args(argc, argv, ":", &options);

    // Layer 1: Validate inputs BEFORE any allocation (fail-fast)
    if (NIL_P(options)) {
        rb_raise(rb_eArgError, "finalize_dictionary requires keyword arguments");
    }

    // Get required parameters
    VALUE content_val = rb_hash_aref(options, ID2SYM(rb_intern("content")));
    VALUE samples_val = rb_hash_aref(options, ID2SYM(rb_intern("samples")));
    VALUE max_size_val = rb_hash_aref(options, ID2SYM(rb_intern("max_size")));

    if (NIL_P(content_val)) {
        rb_raise(rb_eArgError, "content: parameter is required");
    }
    if (NIL_P(samples_val)) {
        rb_raise(rb_eArgError, "samples: parameter is required");
    }
    if (NIL_P(max_size_val)) {
        rb_raise(rb_eArgError, "max_size: parameter is required");
    }

    // Validate types early
    StringValue(content_val);
    Check_Type(samples_val, T_ARRAY);
    size_t max_size = NUM2SIZET(max_size_val);

    long num_samples = RARRAY_LEN(samples_val);
    if (num_samples == 0) {
        rb_raise(rb_eArgError, "samples array cannot be empty");
    }
    // ZDICT takes the sample count as `unsigned`; refuse counts the cast below would truncate.
    if ((long)(unsigned)num_samples != num_samples) {
        rb_raise(rb_eArgError, "too many samples (%ld)", num_samples);
    }

    // Validate all samples and snapshot them as frozen Strings BEFORE allocating.
    // StringValue() may invoke #to_str (arbitrary Ruby code) and only converts the local copy,
    // so re-reading the caller's array later could yield a non-String, a missing element, or a
    // String whose length has changed. Everything after this loop reads the private snapshot.
    VALUE frozen_samples = rb_ary_new_capa(num_samples);
    size_t total_samples_size = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(samples_val, i);
        StringValue(sample);  // Validate type early - may raise TypeError
        sample = rb_str_new_frozen(sample);
        rb_ary_push(frozen_samples, sample);
        total_samples_size += (size_t)RSTRING_LEN(sample);
    }

    // Get optional parameters
    VALUE compression_level_val = rb_hash_aref(options, ID2SYM(rb_intern("compression_level")));
    VALUE dict_id_val = rb_hash_aref(options, ID2SYM(rb_intern("dict_id")));

    // Setup ZDICT_params_t
    ZDICT_params_t params;
    memset(&params, 0, sizeof(params));
    params.compressionLevel = NIL_P(compression_level_val) ? 0 : NUM2INT(compression_level_val);
    params.dictID = NIL_P(dict_id_val) ? 0 : NUM2UINT(dict_id_val);
    params.notificationLevel = 0;

    // Layer 2: Allocate late - only after validation passes
    dict_training_resources resources = {NULL, NULL, NULL};
    resources.sample_sizes = ALLOC_N(size_t, num_samples);
    resources.samples_buffer = ALLOC_N(char, total_samples_size);
    resources.dict_buffer = ALLOC_N(char, max_size);

    // Layer 3: Cleanup is explicit on both the error and the success path below.
    // NOTE(review): no rb_ensure is in place here, so an exception raised by a later
    // allocation (ALLOC_N, rb_str_new) would skip dict_training_cleanup.
    // Build samples buffer from the frozen snapshot - lengths cannot have changed
    size_t offset = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(frozen_samples, i);
        size_t sample_len = (size_t)RSTRING_LEN(sample);
        resources.sample_sizes[i] = sample_len;
        memcpy(resources.samples_buffer + offset, RSTRING_PTR(sample), sample_len);
        offset += sample_len;
    }
    RB_GC_GUARD(frozen_samples);

    // Finalize the dictionary
    size_t dict_size = ZDICT_finalizeDictionary(
        resources.dict_buffer, max_size,
        RSTRING_PTR(content_val), RSTRING_LEN(content_val),
        resources.samples_buffer, resources.sample_sizes, (unsigned)num_samples,
        params
    );

    // Check for errors
    if (ZDICT_isError(dict_size)) {
        dict_training_cleanup((VALUE)&resources);
        rb_raise(rb_eRuntimeError, "Dictionary finalization failed: %s", ZDICT_getErrorName(dict_size));
    }

    // Create Ruby string with the finalized dictionary
    VALUE dict_string = rb_str_new(resources.dict_buffer, dict_size);

    // Clean up all resources
    dict_training_cleanup((VALUE)&resources);

    return dict_string;
}

.find_frame_compressed_size(data) ⇒ `Object`

# File 'ext/vibe_zstd/frames.c', line 108

// Returns the compressed size of the first complete frame in `data` (header and checksum
// included), as reported by ZSTD_findFrameCompressedSize(). Handy for splitting
// concatenated frames in multi-frame archives.
// Raises RuntimeError when zstd reports an error for the input.
static VALUE
vibe_zstd_find_frame_compressed_size(VALUE self, VALUE data) {
    (void)self;
    StringValue(data);

    const char* frame_ptr = RSTRING_PTR(data);
    size_t available = RSTRING_LEN(data);
    size_t compressed_len = ZSTD_findFrameCompressedSize(frame_ptr, available);

    if (ZSTD_isError(compressed_len)) {
        rb_raise(rb_eRuntimeError, "Failed to find frame size: %s", ZSTD_getErrorName(compressed_len));
    }

    return SIZET2NUM(compressed_len);
}

.frame_content_size(data) ⇒ `Object`

Get the decompressed content size from a compressed frame. Returns nil if the size is unknown or the data is invalid.



26
27
28

# File 'lib/vibe_zstd.rb', line 26

# Module-level shortcut for DCtx.frame_content_size.
#
# @param data the compressed frame, passed straight through to DCtx
# @return the value DCtx.frame_content_size returns (documented as the
#   decompressed content size, or nil when unknown or the data is invalid)
def self.frame_content_size(data)
  DCtx.frame_content_size(data)
end

.get_dict_id(dict_data) ⇒ `Object`

VibeZstd.get_dict_id(dict_data)

# File 'ext/vibe_zstd/dict.c', line 412

// VibeZstd.get_dict_id(dict_data)
//
// Returns ZDICT_getDictID() for the given dictionary bytes as a Ruby Integer.
static VALUE
vibe_zstd_get_dict_id(VALUE self, VALUE dict_data) {
    (void)self;
    StringValue(dict_data);

    const char* dict_ptr = RSTRING_PTR(dict_data);
    size_t dict_len = RSTRING_LEN(dict_data);

    return UINT2NUM(ZDICT_getDictID(dict_ptr, dict_len));
}

.get_dict_id_from_frame(data) ⇒ `Object`

VibeZstd.get_dict_id_from_frame(data)

# File 'ext/vibe_zstd/dict.c', line 421

// VibeZstd.get_dict_id_from_frame(data)
//
// Returns ZSTD_getDictID_fromFrame() for the given frame bytes as a Ruby Integer.
static VALUE
vibe_zstd_get_dict_id_from_frame(VALUE self, VALUE data) {
    (void)self;
    StringValue(data);

    const char* frame_ptr = RSTRING_PTR(data);
    size_t frame_len = RSTRING_LEN(data);

    return UINT2NUM(ZSTD_getDictID_fromFrame(frame_ptr, frame_len));
}

.max_compression_level ⇒ `Object` Also known as: max_level

# File 'ext/vibe_zstd/vibe_zstd.c', line 237

// Returns ZSTD_maxCLevel() as a Ruby Integer; the receiver is not used.
static VALUE
vibe_zstd_max_c_level(VALUE self) {
    const int level = ZSTD_maxCLevel();

    (void)self;
    return INT2NUM(level);
}

.min_compression_level ⇒ `Object` Also known as: min_level

# File 'ext/vibe_zstd/vibe_zstd.c', line 231

// Returns ZSTD_minCLevel() as a Ruby Integer; the receiver is not used.
static VALUE
vibe_zstd_min_c_level(VALUE self) {
    const int level = ZSTD_minCLevel();

    (void)self;
    return INT2NUM(level);
}

.read_skippable_frame(data) ⇒ `Object`

# File 'ext/vibe_zstd/frames.c', line 64

// Decodes the skippable frame at the start of `data`.
//
// Returns a two-element Array: [content String, magic_variant Integer].
// Raises ArgumentError when `data` does not start with a skippable frame or is shorter than
// the 8-byte header, and RuntimeError when ZSTD_readSkippableFrame() reports an error.
static VALUE
vibe_zstd_read_skippable_frame(VALUE self, VALUE data) {
    (void)self;
    StringValue(data);

    const char* src = RSTRING_PTR(data);
    size_t src_size = (size_t)RSTRING_LEN(data);

    if (!ZSTD_isSkippableFrame(src, src_size)) {
        rb_raise(rb_eArgError, "data is not a skippable frame (%zu bytes provided)", src_size);
    }

    if (src_size < 8) {
        rb_raise(rb_eArgError, "skippable frame too small (%zu bytes, minimum 8 bytes required)", src_size);
    }

    // Content size is in bytes 4-7 (little-endian uint32). Assemble it byte by byte so the
    // value is also right on big-endian hosts; a raw memcpy would read it in host order.
    const unsigned char* size_bytes = (const unsigned char*)src + 4;
    uint32_t content_size = (uint32_t)size_bytes[0]
                          | ((uint32_t)size_bytes[1] << 8)
                          | ((uint32_t)size_bytes[2] << 16)
                          | ((uint32_t)size_bytes[3] << 24);

    // The declared size is untrusted input: never reserve more than the bytes that actually
    // follow the header. A frame claiming more than is present is still rejected by
    // ZSTD_readSkippableFrame() below, just without a large allocation first.
    size_t available = src_size - 8;
    size_t capacity = content_size < available ? (size_t)content_size : available;

    VALUE result = rb_str_buf_new((long)capacity);
    unsigned magic_variant;

    size_t bytes_read = ZSTD_readSkippableFrame(
        RSTRING_PTR(result),
        capacity,
        &magic_variant,
        src,
        src_size
    );

    if (ZSTD_isError(bytes_read)) {
        rb_raise(rb_eRuntimeError, "Failed to read skippable frame: %s", ZSTD_getErrorName(bytes_read));
    }

    rb_str_set_len(result, bytes_read);

    // Return [content, magic_variant]
    VALUE result_ary = rb_ary_new_capa(2);
    rb_ary_push(result_ary, result);
    rb_ary_push(result_ary, UINT2NUM(magic_variant));
    return result_ary;
}

.skippable_frame?(data) ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/vibe_zstd/frames.c', line 12

// Predicate: Qtrue when ZSTD_isSkippableFrame() returns non-zero for `data`, Qfalse otherwise.
static VALUE
vibe_zstd_skippable_frame_p(VALUE self, VALUE data) {
    (void)self;
    StringValue(data);

    if (ZSTD_isSkippableFrame(RSTRING_PTR(data), RSTRING_LEN(data))) {
        return Qtrue;
    }
    return Qfalse;
}

.train_dict(*args) ⇒ `Object`

For large datasets, consider training on a representative subset to reduce memory footprint.

# File 'ext/vibe_zstd/dict.c', line 133

// Trains a dictionary from an Array of sample Strings with ZDICT_trainFromBuffer().
//
// Arguments: samples (Array, required, non-empty) and an optional max_dict_size: keyword
// (112 * 1024 bytes when omitted).
// Returns the trained dictionary as a new String.
// Raises TypeError for a non-Array argument or a sample that is not String-convertible,
// ArgumentError for an empty samples array or a sample count that does not fit in `unsigned`,
// and RuntimeError when training fails.
static VALUE
vibe_zstd_train_dict(int argc, VALUE* argv, VALUE self) {
    (void)self;
    VALUE samples, options;
    rb_scan_args(argc, argv, "1:", &samples, &options);

    // Layer 1: Validate inputs BEFORE any allocation (fail-fast)
    Check_Type(samples, T_ARRAY);
    long num_samples = RARRAY_LEN(samples);

    if (num_samples == 0) {
        rb_raise(rb_eArgError, "samples array cannot be empty");
    }
    // ZDICT takes the sample count as `unsigned`; refuse counts the cast below would truncate.
    if ((long)(unsigned)num_samples != num_samples) {
        rb_raise(rb_eArgError, "too many samples (%ld)", num_samples);
    }

    // Validate all samples and snapshot them as frozen Strings BEFORE allocating.
    // StringValue() may invoke #to_str (arbitrary Ruby code) and only converts the local copy,
    // so re-reading the caller's array later could yield a non-String, a missing element, or a
    // String whose length has changed. Everything after this loop reads the private snapshot.
    VALUE frozen_samples = rb_ary_new_capa(num_samples);
    size_t total_samples_size = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(samples, i);
        StringValue(sample);  // Validate type early - may raise TypeError
        sample = rb_str_new_frozen(sample);
        rb_ary_push(frozen_samples, sample);
        total_samples_size += (size_t)RSTRING_LEN(sample);
    }

    // Parse options
    VALUE max_dict_size_val = Qnil;
    if (!NIL_P(options)) {
        max_dict_size_val = rb_hash_aref(options, ID2SYM(rb_intern("max_dict_size")));
    }

    // Default max dictionary size is 112KB (zstd default)
    size_t max_dict_size = NIL_P(max_dict_size_val) ? (112 * 1024) : NUM2SIZET(max_dict_size_val);

    // Layer 2: Allocate late - only after validation passes
    dict_training_resources resources = {NULL, NULL, NULL};
    resources.sample_sizes = ALLOC_N(size_t, num_samples);
    resources.samples_buffer = ALLOC_N(char, total_samples_size);
    resources.dict_buffer = ALLOC_N(char, max_dict_size);

    // Layer 3: Cleanup is explicit on both the error and the success path below.
    // NOTE(review): no rb_ensure is in place here, so an exception raised by a later
    // allocation (ALLOC_N, rb_str_new) would skip dict_training_cleanup.
    // Build samples buffer from the frozen snapshot - lengths cannot have changed
    size_t offset = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(frozen_samples, i);
        size_t sample_len = (size_t)RSTRING_LEN(sample);
        resources.sample_sizes[i] = sample_len;
        memcpy(resources.samples_buffer + offset, RSTRING_PTR(sample), sample_len);
        offset += sample_len;
    }
    RB_GC_GUARD(frozen_samples);

    // Train the dictionary
    size_t dict_size = ZDICT_trainFromBuffer(
        resources.dict_buffer, max_dict_size,
        resources.samples_buffer, resources.sample_sizes, (unsigned)num_samples
    );

    // Check for errors
    if (ZDICT_isError(dict_size)) {
        dict_training_cleanup((VALUE)&resources);
        rb_raise(rb_eRuntimeError, "Dictionary training failed: %s", ZDICT_getErrorName(dict_size));
    }

    // Create Ruby string with the trained dictionary
    VALUE dict_string = rb_str_new(resources.dict_buffer, dict_size);

    // Clean up all resources
    dict_training_cleanup((VALUE)&resources);

    return dict_string;
}

.train_dict_cover(*args) ⇒ `Object`

For large datasets, consider training on a representative subset to reduce memory footprint.

# File 'ext/vibe_zstd/dict.c', line 205

// Trains a dictionary from an Array of sample Strings with ZDICT_trainFromBuffer_cover().
//
// Arguments: samples (Array, required, non-empty) plus optional keywords copied into
// ZDICT_cover_params_t: k:, d:, steps:, split_point: (1.0 when omitted), shrink_dict:,
// shrink_dict_max_regression:, nb_threads:; and max_dict_size: (112 * 1024 bytes when omitted).
// Returns the trained dictionary as a new String.
// Raises TypeError for a non-Array argument or a sample that is not String-convertible,
// ArgumentError for an empty samples array or a sample count that does not fit in `unsigned`,
// and RuntimeError when training fails.
static VALUE
vibe_zstd_train_dict_cover(int argc, VALUE* argv, VALUE self) {
    (void)self;
    VALUE samples, options;
    rb_scan_args(argc, argv, "1:", &samples, &options);

    // Layer 1: Validate inputs BEFORE any allocation (fail-fast)
    Check_Type(samples, T_ARRAY);
    long num_samples = RARRAY_LEN(samples);

    if (num_samples == 0) {
        rb_raise(rb_eArgError, "samples array cannot be empty");
    }
    // ZDICT takes the sample count as `unsigned`; refuse counts the cast below would truncate.
    if ((long)(unsigned)num_samples != num_samples) {
        rb_raise(rb_eArgError, "too many samples (%ld)", num_samples);
    }

    // Validate all samples and snapshot them as frozen Strings BEFORE allocating.
    // StringValue() may invoke #to_str (arbitrary Ruby code) and only converts the local copy,
    // so re-reading the caller's array later could yield a non-String, a missing element, or a
    // String whose length has changed. Everything after this loop reads the private snapshot.
    VALUE frozen_samples = rb_ary_new_capa(num_samples);
    size_t total_samples_size = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(samples, i);
        StringValue(sample);  // Validate type early - may raise TypeError
        sample = rb_str_new_frozen(sample);
        rb_ary_push(frozen_samples, sample);
        total_samples_size += (size_t)RSTRING_LEN(sample);
    }

    // Initialize COVER parameters with defaults
    ZDICT_cover_params_t params;
    memset(&params, 0, sizeof(params));
    params.splitPoint = 1.0;  // Default split point

    // Parse options
    // NOTE(review): k and d stay 0 when omitted, and zdict.h describes `steps` as used only
    // for optimization - confirm whether ZDICT_optimizeTrainFromBuffer_cover was intended
    // for the "parameters omitted" case.
    if (!NIL_P(options)) {
        VALUE v;

        v = rb_hash_aref(options, ID2SYM(rb_intern("k")));
        if (!NIL_P(v)) params.k = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("d")));
        if (!NIL_P(v)) params.d = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("steps")));
        if (!NIL_P(v)) params.steps = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("split_point")));
        if (!NIL_P(v)) params.splitPoint = NUM2DBL(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("shrink_dict")));
        if (!NIL_P(v)) params.shrinkDict = RTEST(v) ? 1 : 0;

        v = rb_hash_aref(options, ID2SYM(rb_intern("shrink_dict_max_regression")));
        if (!NIL_P(v)) params.shrinkDictMaxRegression = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("nb_threads")));
        if (!NIL_P(v)) params.nbThreads = NUM2UINT(v);
    }

    // Get max_dict_size (default 112KB)
    VALUE max_dict_size_val = Qnil;
    if (!NIL_P(options)) {
        max_dict_size_val = rb_hash_aref(options, ID2SYM(rb_intern("max_dict_size")));
    }
    size_t max_dict_size = NIL_P(max_dict_size_val) ? (112 * 1024) : NUM2SIZET(max_dict_size_val);
    params.zParams.compressionLevel = 0;  // Use default compression level

    // Layer 2: Allocate late - only after validation passes
    dict_training_resources resources = {NULL, NULL, NULL};
    resources.sample_sizes = ALLOC_N(size_t, num_samples);
    resources.samples_buffer = ALLOC_N(char, total_samples_size);
    resources.dict_buffer = ALLOC_N(char, max_dict_size);

    // Layer 3: Cleanup is explicit on both the error and the success path below.
    // NOTE(review): no rb_ensure is in place here, so an exception raised by a later
    // allocation (ALLOC_N, rb_str_new) would skip dict_training_cleanup.
    // Build samples buffer from the frozen snapshot - lengths cannot have changed
    size_t offset = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(frozen_samples, i);
        size_t sample_len = (size_t)RSTRING_LEN(sample);
        resources.sample_sizes[i] = sample_len;
        memcpy(resources.samples_buffer + offset, RSTRING_PTR(sample), sample_len);
        offset += sample_len;
    }
    RB_GC_GUARD(frozen_samples);

    // Train the dictionary using COVER algorithm
    size_t dict_size = ZDICT_trainFromBuffer_cover(
        resources.dict_buffer, max_dict_size,
        resources.samples_buffer, resources.sample_sizes, (unsigned)num_samples,
        params
    );

    // Check for errors
    if (ZDICT_isError(dict_size)) {
        dict_training_cleanup((VALUE)&resources);
        rb_raise(rb_eRuntimeError, "Dictionary training failed: %s", ZDICT_getErrorName(dict_size));
    }

    // Create Ruby string with the trained dictionary
    VALUE dict_string = rb_str_new(resources.dict_buffer, dict_size);

    // Clean up all resources
    dict_training_cleanup((VALUE)&resources);

    return dict_string;
}

.train_dict_fast_cover(*args) ⇒ `Object`

For large datasets, consider training on a representative subset to reduce memory footprint.

# File 'ext/vibe_zstd/dict.c', line 308

// Trains a dictionary from an Array of sample Strings with ZDICT_trainFromBuffer_fastCover().
//
// Arguments: samples (Array, required, non-empty) plus optional keywords copied into
// ZDICT_fastCover_params_t: k:, d:, f:, split_point: (1.0 when omitted), accel:, shrink_dict:,
// shrink_dict_max_regression:, nb_threads:; and max_dict_size: (112 * 1024 bytes when omitted).
// Returns the trained dictionary as a new String.
// Raises TypeError for a non-Array argument or a sample that is not String-convertible,
// ArgumentError for an empty samples array or a sample count that does not fit in `unsigned`,
// and RuntimeError when training fails.
static VALUE
vibe_zstd_train_dict_fast_cover(int argc, VALUE* argv, VALUE self) {
    (void)self;
    VALUE samples, options;
    rb_scan_args(argc, argv, "1:", &samples, &options);

    // Layer 1: Validate inputs BEFORE any allocation (fail-fast)
    Check_Type(samples, T_ARRAY);
    long num_samples = RARRAY_LEN(samples);

    if (num_samples == 0) {
        rb_raise(rb_eArgError, "samples array cannot be empty");
    }
    // ZDICT takes the sample count as `unsigned`; refuse counts the cast below would truncate.
    if ((long)(unsigned)num_samples != num_samples) {
        rb_raise(rb_eArgError, "too many samples (%ld)", num_samples);
    }

    // Validate all samples and snapshot them as frozen Strings BEFORE allocating.
    // StringValue() may invoke #to_str (arbitrary Ruby code) and only converts the local copy,
    // so re-reading the caller's array later could yield a non-String, a missing element, or a
    // String whose length has changed. Everything after this loop reads the private snapshot.
    VALUE frozen_samples = rb_ary_new_capa(num_samples);
    size_t total_samples_size = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(samples, i);
        StringValue(sample);  // Validate type early - may raise TypeError
        sample = rb_str_new_frozen(sample);
        rb_ary_push(frozen_samples, sample);
        total_samples_size += (size_t)RSTRING_LEN(sample);
    }

    // Initialize fastCover parameters with defaults
    ZDICT_fastCover_params_t params;
    memset(&params, 0, sizeof(params));
    params.splitPoint = 1.0;  // Default split point

    // Parse options
    // NOTE(review): k and d stay 0 when omitted - confirm that
    // ZDICT_trainFromBuffer_fastCover accepts that, or whether the optimize variant was
    // intended for the "parameters omitted" case.
    if (!NIL_P(options)) {
        VALUE v;

        v = rb_hash_aref(options, ID2SYM(rb_intern("k")));
        if (!NIL_P(v)) params.k = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("d")));
        if (!NIL_P(v)) params.d = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("f")));
        if (!NIL_P(v)) params.f = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("split_point")));
        if (!NIL_P(v)) params.splitPoint = NUM2DBL(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("accel")));
        if (!NIL_P(v)) params.accel = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("shrink_dict")));
        if (!NIL_P(v)) params.shrinkDict = RTEST(v) ? 1 : 0;

        v = rb_hash_aref(options, ID2SYM(rb_intern("shrink_dict_max_regression")));
        if (!NIL_P(v)) params.shrinkDictMaxRegression = NUM2UINT(v);

        v = rb_hash_aref(options, ID2SYM(rb_intern("nb_threads")));
        if (!NIL_P(v)) params.nbThreads = NUM2UINT(v);
    }

    // Get max_dict_size (default 112KB)
    VALUE max_dict_size_val = Qnil;
    if (!NIL_P(options)) {
        max_dict_size_val = rb_hash_aref(options, ID2SYM(rb_intern("max_dict_size")));
    }
    size_t max_dict_size = NIL_P(max_dict_size_val) ? (112 * 1024) : NUM2SIZET(max_dict_size_val);
    params.zParams.compressionLevel = 0;  // Use default compression level

    // Layer 2: Allocate late - only after validation passes
    dict_training_resources resources = {NULL, NULL, NULL};
    resources.sample_sizes = ALLOC_N(size_t, num_samples);
    resources.samples_buffer = ALLOC_N(char, total_samples_size);
    resources.dict_buffer = ALLOC_N(char, max_dict_size);

    // Layer 3: Cleanup is explicit on both the error and the success path below.
    // NOTE(review): no rb_ensure is in place here, so an exception raised by a later
    // allocation (ALLOC_N, rb_str_new) would skip dict_training_cleanup.
    // Build samples buffer from the frozen snapshot - lengths cannot have changed
    size_t offset = 0;
    for (long i = 0; i < num_samples; i++) {
        VALUE sample = rb_ary_entry(frozen_samples, i);
        size_t sample_len = (size_t)RSTRING_LEN(sample);
        resources.sample_sizes[i] = sample_len;
        memcpy(resources.samples_buffer + offset, RSTRING_PTR(sample), sample_len);
        offset += sample_len;
    }
    RB_GC_GUARD(frozen_samples);

    // Train the dictionary using fast COVER algorithm
    size_t dict_size = ZDICT_trainFromBuffer_fastCover(
        resources.dict_buffer, max_dict_size,
        resources.samples_buffer, resources.sample_sizes, (unsigned)num_samples,
        params
    );

    // Check for errors
    if (ZDICT_isError(dict_size)) {
        dict_training_cleanup((VALUE)&resources);
        rb_raise(rb_eRuntimeError, "Dictionary training failed: %s", ZDICT_getErrorName(dict_size));
    }

    // Create Ruby string with the trained dictionary
    VALUE dict_string = rb_str_new(resources.dict_buffer, dict_size);

    // Clean up all resources
    dict_training_cleanup((VALUE)&resources);

    return dict_string;
}

.version_number ⇒ `Object`

Module-level version and compression level functions

# File 'ext/vibe_zstd/vibe_zstd.c', line 219

// Returns ZSTD_versionNumber() as a Ruby Integer; the receiver is not used.
static VALUE
vibe_zstd_version_number(VALUE self) {
    const unsigned version = ZSTD_versionNumber();

    (void)self;
    return UINT2NUM(version);
}

.version_string ⇒ `Object`

# File 'ext/vibe_zstd/vibe_zstd.c', line 225

// Returns ZSTD_versionString() copied into a new Ruby String; the receiver is not used.
static VALUE
vibe_zstd_version_string(VALUE self) {
    const char* version = ZSTD_versionString();

    (void)self;
    return rb_str_new_cstr(version);
}

.write_skippable_frame(*args) ⇒ `Object`

# File 'ext/vibe_zstd/frames.c', line 20

// Wraps `data` in a skippable frame via ZSTD_writeSkippableFrame().
//
// Arguments: data (String, required) and an optional Hash whose :magic_number entry selects
// the magic variant (0 when absent; values above 15 are rejected).
// Returns the encoded frame as a new String.
// Raises TypeError when the second argument is not a Hash, ArgumentError for an out-of-range
// magic_number, and RuntimeError when zstd reports an error.
static VALUE
vibe_zstd_write_skippable_frame(int argc, VALUE *argv, VALUE self) {
    VALUE payload, opts;
    unsigned variant = 0;  // used when no magic_number is supplied

    (void)self;
    rb_scan_args(argc, argv, "11", &payload, &opts);
    StringValue(payload);

    if (!NIL_P(opts)) {
        Check_Type(opts, T_HASH);
        VALUE requested = rb_hash_aref(opts, ID2SYM(rb_intern("magic_number")));
        if (!NIL_P(requested)) {
            variant = NUM2UINT(requested);
            if (variant > 15) {
                rb_raise(rb_eArgError, "magic_number %u out of bounds (valid: 0-15)", variant);
            }
        }
    }

    const char* payload_ptr = RSTRING_PTR(payload);
    size_t payload_len = RSTRING_LEN(payload);

    // Frame layout: 4-byte magic (0x184D2A5X) + 4-byte size + content, hence the 8 extra bytes.
    // Decoders skip these frames, which makes them usable for custom metadata or padding.
    size_t capacity = 8 + payload_len;
    VALUE frame = rb_str_buf_new(capacity);

    size_t written = ZSTD_writeSkippableFrame(RSTRING_PTR(frame), capacity, payload_ptr, payload_len, variant);

    if (ZSTD_isError(written)) {
        rb_raise(rb_eRuntimeError, "Failed to write skippable frame: %s", ZSTD_getErrorName(written));
    }

    rb_str_set_len(frame, written);
    return frame;
}

Module: VibeZstd

Defined Under Namespace

Constant Summary collapse

Class Method Summary collapse

Class Method Details

.compress(data, **options) ⇒ Object

.compress_bound(size) ⇒ Object

.decompress(data, **options) ⇒ Object

.default_compression_level ⇒ Object Also known as: default_level

.dict_header_size(dict_data) ⇒ Object

.each_skippable_frame(data) ⇒ Object

.finalize_dictionary(*args) ⇒ Object

.find_frame_compressed_size(data) ⇒ Object

.frame_content_size(data) ⇒ Object

.get_dict_id(dict_data) ⇒ Object

.get_dict_id_from_frame(data) ⇒ Object

.max_compression_level ⇒ Object Also known as: max_level

.min_compression_level ⇒ Object Also known as: min_level

.read_skippable_frame(data) ⇒ Object

.skippable_frame?(data) ⇒ Boolean

.train_dict(*args) ⇒ Object

.train_dict_cover(*args) ⇒ Object

.train_dict_fast_cover(*args) ⇒ Object

.version_number ⇒ Object

.version_string ⇒ Object

.write_skippable_frame(*args) ⇒ Object

.compress(data, **options) ⇒ `Object`

.compress_bound(size) ⇒ `Object`

.decompress(data, **options) ⇒ `Object`

.default_compression_level ⇒ `Object` Also known as: default_level

.dict_header_size(dict_data) ⇒ `Object`

.each_skippable_frame(data) ⇒ `Object`

.finalize_dictionary(*args) ⇒ `Object`

.find_frame_compressed_size(data) ⇒ `Object`

.frame_content_size(data) ⇒ `Object`

.get_dict_id(dict_data) ⇒ `Object`

.get_dict_id_from_frame(data) ⇒ `Object`

.max_compression_level ⇒ `Object` Also known as: max_level

.min_compression_level ⇒ `Object` Also known as: min_level

.read_skippable_frame(data) ⇒ `Object`

.skippable_frame?(data) ⇒ `Boolean`

.train_dict(*args) ⇒ `Object`

.train_dict_cover(*args) ⇒ `Object`

.train_dict_fast_cover(*args) ⇒ `Object`

.version_number ⇒ `Object`

.version_string ⇒ `Object`

.write_skippable_frame(*args) ⇒ `Object`