Class: XRT::Parser

Inherits:
Object
  • Object
show all
Defined in:
lib/xrt/parser.rb

Instance Method Summary collapse

Constructor Details

#initialize(source = '') ⇒ Parser

Returns a new instance of Parser.



5
6
7
# File 'lib/xrt/parser.rb', line 5

def initialize(source='')
  @source = source
end

Instance Method Details

#documentObject



9
10
11
12
13
14
15
16
# File 'lib/xrt/parser.rb', line 9

def document
  doc = XRT::Statement::Document.new

  tokenized = self.tokens

  parse_contents(tokenized, doc)
  doc
end

#new_statement(content) ⇒ Object



108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
# File 'lib/xrt/parser.rb', line 108

def new_statement content
  syntax = XRT::Syntax.new

  block_level = syntax.block_level content

  if block_level == 1
    XRT::Statement::ControlBlock.new content
  elsif block_level == -1
    XRT::Statement::End.new content
  elsif syntax.block? content
    XRT::Statement::Directive.new content
  elsif syntax.tag_start? content
    XRT::Statement::Tag.new content
  elsif syntax.tag_end? content
    XRT::Statement::TagEnd.new content
  elsif syntax.whitespace? content
    XRT::Statement::Whitespace.new content
  else
    XRT::Statement::Text.new content
  end
end

#parse_contents(tokenized, node, in_raw_text = false) ⇒ Object

read tokens from tokenized tokens push contents to (container) node returns parsed container node return when tokenized is empty, or node is closed



22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
# File 'lib/xrt/parser.rb', line 22

def parse_contents(tokenized, node, in_raw_text = false)
  if node.kind_of?(XRT::Statement::TagPair) && node.children[0].tag_raw_text_element?
    parse_raw_text_element(tokenized, node)
    return
  end

  while tokenized.length > 0
    statement = new_statement(tokenized.shift)

    unless in_raw_text
      case statement
      when XRT::Statement::Tag
        parse_contents(tokenized, statement)
        if statement.tag_opening?
          statement = XRT::Statement::TagPair.new(statement)
          parse_contents(tokenized, statement, in_raw_text)
          node << statement
          next
        elsif statement.tag_closing?
          statement = XRT::Statement::TagPairEnd.new(statement)
          node << statement
          break
        else
          node << statement
          next
        end
      end
    end

    if in_raw_text
      if statement.kind_of?(XRT::Statement::Tag) || statement.kind_of?(XRT::Statement::TagEnd)
        statement = XRT::Statement::Text.new(statement.content)
      end
    end

    case statement
    when XRT::Statement::ControlBlock
      parse_contents(tokenized, statement, in_raw_text)
      node << statement
    when XRT::Statement::End
      node << statement
      break
    else
      node << statement
    end
  end

  node
end

#parse_raw_text_element(tokenized, node) ⇒ Object

parse all statements as texts and whitespaces until </script> will appear.



73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
# File 'lib/xrt/parser.rb', line 73

def parse_raw_text_element(tokenized, node)
  syntax = XRT::Syntax.new
  tag_name = node.children[0].tag_name

  while tokenized.length > 0
    maybe_close_tag = new_statement(tokenized[0])
    maybe_closing_content = new_statement(tokenized[1])

    if maybe_close_tag.kind_of?(XRT::Statement::Tag)
      maybe_close_tag << maybe_closing_content
      if maybe_close_tag.tag_closing? && maybe_close_tag.tag_name == tag_name
        close_tag = new_statement(tokenized.shift)
        parse_contents(tokenized, close_tag)
        statement = XRT::Statement::TagPairEnd.new(close_tag)
        node << statement
        return
      end
    end

    content = tokenized.shift
    block_level = syntax.block_level content
    if block_level == 1
      statement = XRT::Statement::ControlBlock.new content
      parse_contents(tokenized, statement, true)
      node << statement
    elsif syntax.block? content
      node << XRT::Statement::Directive.new(content)
    elsif syntax.whitespace? content
      node << XRT::Statement::Whitespace.new(content)
    else
      node << XRT::Statement::Text.new(content)
    end
  end
end

#read_directive(source) ⇒ Object



164
165
166
167
168
169
170
171
172
173
# File 'lib/xrt/parser.rb', line 164

def read_directive source
  return nil unless source[0...2] == '[%'

  buffer = ''
  while source[0...2] != '%]'
    buffer << source.slice!(0)
  end
  buffer << source.slice!(0, 2)
  buffer
end

#read_tag_end(source) ⇒ Object



199
200
201
202
# File 'lib/xrt/parser.rb', line 199

def read_tag_end source
  return nil unless source[0] == '>'
  source.slice!(0)
end

#read_tag_start(source) ⇒ Object



194
195
196
197
# File 'lib/xrt/parser.rb', line 194

def read_tag_start source
  return nil unless source[0] == '<'
  source.slice!(0)
end

#read_text(source) ⇒ Object



175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
# File 'lib/xrt/parser.rb', line 175

def read_text source
  return nil if source[0...2] == '[%'
  return nil if source[0] == '<'
  return nil if source[0] == '>'

  buffer = ''
  while true
    return buffer if source[0...2] == '[%'
    return buffer if source[0] == '<'
    return buffer if source[0] == '>'
    break if source.length < 2
    buffer << source.slice!(0)
  end

  buffer << source.slice!(0, source.length)

  buffer
end

#split_whitespace(text) ⇒ Object



151
152
153
154
155
156
157
158
159
160
161
162
# File 'lib/xrt/parser.rb', line 151

def split_whitespace(text)
  prefix, suffix=nil
  text.sub!(/\A(\s+)/) {|matched|
    prefix = matched
    ''
  }
  text.sub!(/(\s+)\Z/) {|matched|
    suffix = matched
    ''
  }
  [prefix, text, suffix].compact.delete_if{|s| s.empty?}
end

#tokensObject



130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
# File 'lib/xrt/parser.rb', line 130

def tokens
  reading = @source.dup
  result = []

  while reading.length > 0
    if got = read_directive(reading)
      result << got
    elsif got = read_tag_start(reading)
      result << got
    elsif got = read_tag_end(reading)
      result << got
    elsif got = read_text(reading)
      result.concat(split_whitespace(got))
    else
      raise "failed to parse #{@source}"
    end
  end

  result
end