Class: Liquid::C::Tokenizer

Inherits:

Object

Object
Liquid::C::Tokenizer

show all

Defined in: lib/liquid/c.rb,
ext/liquid_c/tokenizer.c

Constant Summary collapse

MAX_SOURCE_BYTE_SIZE =

(1 << 24) - 1

Instance Method Summary collapse

#bug_compatible_whitespace_trimming! ⇒ Object

Temporary method that turns on bug-compatible whitespace trimming; it exists only to test the rollout of the fix for the whitespace-trimming bug.
#for_liquid_tag ⇒ Object
#initialize(source, start_line_number, for_liquid_tag) ⇒ Object constructor
#line_number ⇒ Object
#shift ⇒ Object

Constructor Details

#initialize(source, start_line_number, for_liquid_tag) ⇒ `Object`

# File 'ext/liquid_c/tokenizer.c', line 46

// Tokenizer#initialize(source, start_line_number, for_liquid_tag)
//
// Checks that `source` is a String, passes it through check_utf8_encoding,
// and rejects it with an ArgumentError when it is longer than
// (1 << 24) - 1 bytes. The tokenizer then keeps a frozen duplicate of the
// string and positions its cursor range over that copy's bytes.
// Always returns nil.
static VALUE tokenizer_initialize_method(VALUE self, VALUE source, VALUE start_line_number, VALUE for_liquid_tag)
{
    const int max_source_bytes = (1 << 24) - 1;
    tokenizer_t *state;
    VALUE frozen_source;

    Check_Type(source, T_STRING);
    check_utf8_encoding(source, "source");

    if (RSTRING_LEN(source) > max_source_bytes) {
        rb_enc_raise(utf8_encoding, rb_eArgError, "Source too large, max %d bytes", max_source_bytes);
    }

    Tokenizer_Get_Struct(self, state);

    // The cursor pointers refer to the frozen copy's buffer, and that copy is
    // stored on the struct alongside them.
    frozen_source = rb_str_dup_frozen(source);
    state->source = frozen_source;
    state->cursor = RSTRING_PTR(frozen_source);
    state->cursor_end = state->cursor + RSTRING_LEN(frozen_source);
    state->lstrip_flag = false;

    // line_number holds the current line number; a value of 0 means that
    // line numbers aren't being calculated.
    state->line_number = FIX2UINT(start_line_number);
    state->for_liquid_tag = RTEST(for_liquid_tag);

    return Qnil;
}

Instance Method Details

#bug_compatible_whitespace_trimming! ⇒ `Object`

Temporary method that turns on bug-compatible whitespace trimming; it exists only to test the rollout of the fix for the whitespace-trimming bug.

# File 'ext/liquid_c/tokenizer.c', line 275

// Tokenizer#bug_compatible_whitespace_trimming!
//
// Sets the tokenizer's bug_compatible_whitespace_trimming flag to true.
// There is no way to clear the flag from this method. Always returns nil.
static VALUE tokenizer_bug_compatible_whitespace_trimming(VALUE self)
{
    tokenizer_t *state;

    Tokenizer_Get_Struct(self, state);
    state->bug_compatible_whitespace_trimming = true;

    return Qnil;
}

#for_liquid_tag ⇒ `Object`

# File 'ext/liquid_c/tokenizer.c', line 265

// Tokenizer#for_liquid_tag
//
// Reports the tokenizer's for_liquid_tag flag as a Ruby boolean:
// Qtrue when the flag is set, Qfalse otherwise.
static VALUE tokenizer_for_liquid_tag_method(VALUE self)
{
    tokenizer_t *state;

    Tokenizer_Get_Struct(self, state);

    if (state->for_liquid_tag) {
        return Qtrue;
    }
    return Qfalse;
}

#line_number ⇒ `Object`

# File 'ext/liquid_c/tokenizer.c', line 254

// Tokenizer#line_number
//
// Returns the tokenizer's stored line number as a Ruby Integer, or nil when
// the stored value is 0.
static VALUE tokenizer_line_number_method(VALUE self)
{
    tokenizer_t *state;

    Tokenizer_Get_Struct(self, state);

    return state->line_number == 0 ? Qnil : UINT2NUM(state->line_number);
}

#shift ⇒ `Object`

# File 'ext/liquid_c/tokenizer.c', line 223

// Tokenizer#shift
//
// Advances the tokenizer by one token via tokenizer_next. Returns the token's
// full text as a new UTF-8 String, or nil when the resulting token type is
// zero (presumably meaning no token was produced; confirm against
// tokenizer_next).
static VALUE tokenizer_shift_method(VALUE self)
{
    tokenizer_t *state;
    token_t next;

    Tokenizer_Get_Struct(self, state);
    tokenizer_next(state, &next);

    if (next.type) {
        // Tokens handed back to Ruby are the raw string, whitespace and tag
        // delimiters included, so that the exact template can be rebuilt by
        // joining the tokens.
        return rb_enc_str_new(next.str_full, next.len_full, utf8_encoding);
    }

    return Qnil;
}

Class: Liquid::C::Tokenizer

Constant Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(source, start_line_number, for_liquid_tag) ⇒ Object

Instance Method Details

#bug_compatible_whitespace_trimming! ⇒ Object

#for_liquid_tag ⇒ Object

#line_number ⇒ Object

#shift ⇒ Object

#initialize(source, start_line_number, for_liquid_tag) ⇒ `Object`

#bug_compatible_whitespace_trimming! ⇒ `Object`

#for_liquid_tag ⇒ `Object`

#line_number ⇒ `Object`

#shift ⇒ `Object`