Class: Weskit::WML::Parsers::KPEG

Inherits:
Object
  • Object
show all
Defined in:
lib/weskit/wml/parsers/kpeg.rb

Defined Under Namespace

Classes: MemoEntry, ParseError, RuleInfo

Instance Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(str, debug = false) ⇒ KPEG

This is distinct from setup_parser so that a standalone parser can redefine #initialize and still have access to the proper parser setup code.



8
9
10
# File 'lib/weskit/wml/parsers/kpeg.rb', line 8

# Builds a parser for +str+ by handing both arguments straight to
# #setup_parser.
#
# Kept separate from #setup_parser so that a standalone parser can redefine
# #initialize and still reach the setup code.
#
# str   - the input to parse; stored by #setup_parser.
# debug - forwarded to #setup_parser unchanged.
def initialize(str, debug=false)
  setup_parser(str, debug)
end

Instance Attribute Details

#failed_rule ⇒ Object (readonly)

Returns the value of attribute failed_rule.



149
150
151
# File 'lib/weskit/wml/parsers/kpeg.rb', line 149

# Reader for @failed_rule.
#
# The value is nil after #setup_parser and is overwritten by #set_failed_rule
# whenever a failure is recorded further into the input than the previous one.
# The failure reporters treat a Symbol as a key into the class's Rules table
# and interpolate anything else directly into the message.
def failed_rule
  @failed_rule
end

#failing_rule_offset ⇒ Object (readonly)

Returns the value of attribute failing_rule_offset.



28
29
30
# File 'lib/weskit/wml/parsers/kpeg.rb', line 28

# Reader for @failing_rule_offset: the value of @pos at the time
# #set_failed_rule last recorded a failure, or -1 (the value assigned by
# #setup_parser) when no failure has been recorded yet.
def failing_rule_offset
  @failing_rule_offset
end

#pos ⇒ Object

Returns the value of attribute pos.



29
30
31
# File 'lib/weskit/wml/parsers/kpeg.rb', line 29

# Reader for @pos, the parser's current offset into #string.
# #setup_parser starts it at 0; the matching helpers (#match_string, #scan,
# #get_byte) advance it as input is consumed.
def pos
  @pos
end

#result ⇒ Object

Returns the value of attribute result.



29
30
31
# File 'lib/weskit/wml/parsers/kpeg.rb', line 29

# Reader for @result. #setup_parser resets it to nil, and #apply restores it
# from the memo entry when a cached rule outcome is replayed.
# NOTE(review): presumably the value produced by the most recent rule action;
# the code that assigns it during parsing is not visible here.
def result
  @result
end

#string ⇒ Object (readonly)

Returns the value of attribute string.



27
28
29
# File 'lib/weskit/wml/parsers/kpeg.rb', line 27

# Reader for @string, the input being parsed (assigned by #setup_parser and
# temporarily swapped by #external_invoke).
def string
  @string
end

Class Method Details

.rule_info(name, rendered) ⇒ Object



349
350
351
# File 'lib/weskit/wml/parsers/kpeg.rb', line 349

# Convenience factory: wraps +name+ and +rendered+ in a new RuleInfo.
#
# name     - passed to RuleInfo.new as its first argument.
# rendered - passed to RuleInfo.new as its second argument.
#
# The failure reporters read these back through info.name and info.rendered.
# NOTE(review): presumably used to populate the Rules table; confirm at the
# call sites, which are not visible here.
def self.rule_info(name, rendered)
  RuleInfo.new(name, rendered)
end

Instance Method Details

#apply(rule) ⇒ Object



284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
# File 'lib/weskit/wml/parsers/kpeg.rb', line 284

# Runs the rule method named +rule+ at the current position, going through the
# memo table in @memoizations (keyed by rule, then by position).
#
# * A memo entry whose +set+ flag is raised is replayed: @pos and @result are
#   restored from it and its stored answer is returned without re-running the
#   rule.
# * A memo entry whose +set+ flag is not raised is flagged as left-recursive
#   and the call fails with nil (presumably the rule is still running further
#   up the call stack).
# * Otherwise a fresh entry is registered, the rule is invoked, and the
#   outcome is stored. If the rule succeeded and was flagged as left-recursive
#   in the meantime, #grow_lr takes over.
#
# Returns the rule's answer (nil on failure).
def apply(rule)
  cached = @memoizations[rule][@pos]

  if cached
    @pos = cached.pos

    unless cached.set
      cached.left_rec = true
      return nil
    end

    @result = cached.result
    return cached.ans
  end

  origin = @pos
  entry = MemoEntry.new(nil, origin)
  @memoizations[rule][origin] = entry

  answer = __send__(rule)

  # Read the flag before move!, which receives the final state of this call.
  recursed = entry.left_rec
  entry.move!(answer, @pos, @result)

  # Don't bother trying to grow the left recursion
  # if it's failing straight away (thus there is no seed)
  return answer unless answer && recursed

  grow_lr(rule, nil, origin, entry)
end

#apply_with_args(rule, *args) ⇒ Object



249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
# File 'lib/weskit/wml/parsers/kpeg.rb', line 249

# Variant of #apply for rules that take arguments. The memo table is keyed by
# the pair [rule, args], so the same rule called with different arguments is
# cached separately.
#
# * A memo entry whose +set+ flag is raised is replayed: @pos and @result are
#   restored from it and its stored answer is returned.
# * A memo entry whose +set+ flag is not raised is flagged as left-recursive
#   and the call fails with nil.
# * Otherwise a fresh entry is registered, the rule is invoked with +args+,
#   and the outcome is stored. If the rule succeeded and was flagged as
#   left-recursive in the meantime, #grow_lr takes over.
#
# Returns the rule's answer (nil on failure).
def apply_with_args(rule, *args)
  key = [rule, args]
  cached = @memoizations[key][@pos]

  if cached
    @pos = cached.pos

    unless cached.set
      cached.left_rec = true
      return nil
    end

    @result = cached.result
    return cached.ans
  end

  origin = @pos
  entry = MemoEntry.new(nil, origin)
  @memoizations[key][origin] = entry

  answer = __send__(rule, *args)

  # Read the flag before move!, which receives the final state of this call.
  recursed = entry.left_rec
  entry.move!(answer, @pos, @result)

  # Don't bother trying to grow the left recursion
  # if it's failing straight away (thus there is no seed)
  return answer unless answer && recursed

  grow_lr(rule, args, origin, entry)
end

#current_column(target = pos) ⇒ Object



32
33
34
35
36
37
38
# File 'lib/weskit/wml/parsers/kpeg.rb', line 32

# Returns the 1-based column of +target+ within #string.
#
# target - character offset into #string (defaults to the current #pos).
#
# The column is the distance from the nearest newline before +target+. When
# no newline precedes it, +target+ is on the first line and the column is
# target + 1.
def current_column(target=pos)
  # String#rindex treats a negative start as counting from the end of the
  # string, so only search backwards when something precedes +target+.
  if target > 0 && (c = string.rindex("\n", target - 1))
    # +c+ is the newline ending the previous line; the character right after
    # it is column 1, matching the first-line convention below.
    return target - c
  end

  target + 1
end

#current_line(target = pos) ⇒ Object



40
41
42
43
44
45
46
47
48
49
50
51
# File 'lib/weskit/wml/parsers/kpeg.rb', line 40

# Returns the 1-based number of the line in #string that contains +target+.
#
# target - character offset into #string (defaults to the current #pos).
#
# An offset equal to the length of the input (end of input) is reported as
# the last line. Returns -1 when +target+ lies beyond the input or the input
# is empty.
def current_line(target=pos)
  cur_offset = 0
  cur_line = 0

  string.each_line do |line|
    cur_line += 1
    cur_offset += line.size
    # cur_offset is the offset of the first character of the NEXT line, so
    # the comparison must be strict: an offset equal to it is not on this line.
    return cur_line if cur_offset > target
  end

  # End of input: keep reporting the last line so failures at EOF still
  # resolve to a real line.
  return cur_line if cur_line > 0 && target == cur_offset

  -1
end

#external_invoke(other, rule, *args) ⇒ Object



228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
# File 'lib/weskit/wml/parsers/kpeg.rb', line 228

# Runs one of this parser's rules on behalf of another parser.
#
# other - the parser being served; must respond to pos, pos=, string,
#         result= and set_failed_rule.
# rule  - name of the rule method to invoke on this parser.
# args  - extra arguments passed to the rule method.
#
# This parser temporarily adopts +other+'s input and position. On success the
# new position and @result are written back to +other+; on failure +other+ is
# told which rule failed, as "<this class>#<rule>". This parser's own input
# and position are restored afterwards, even if the rule raises.
#
# Returns whatever the rule method returned.
def external_invoke(other, rule, *args)
  saved_pos = @pos
  saved_string = @string

  @pos = other.pos
  @string = other.string

  begin
    outcome = __send__(rule, *args)

    if outcome
      other.pos = @pos
      other.result = @result
    else
      other.set_failed_rule "#{self.class}##{rule}"
    end

    outcome
  ensure
    @pos = saved_pos
    @string = saved_string
  end
end

#failure_caret ⇒ Object



86
87
88
89
90
91
92
# File 'lib/weskit/wml/parsers/kpeg.rb', line 86

# Returns a two-line string: the input line on which the recorded failure
# occurred, followed by a line holding a caret (^) under the failing column.
#
# The line and column come from #current_line and #current_column applied to
# @failing_rule_offset; the column is treated as 1-based.
def failure_caret
  l = current_line @failing_rule_offset
  c = current_column @failing_rule_offset

  line = lines[l-1]

  # String#* raises ArgumentError for a negative count, so a column below 1
  # is clamped and the caret lands under the first character.
  indent = c > 1 ? c - 1 : 0
  "#{line}\n#{' ' * indent}^"
end

#failure_character ⇒ Object



94
95
96
97
98
# File 'lib/weskit/wml/parsers/kpeg.rb', line 94

# Returns the single character of the input found at the recorded failure
# position, located through #current_line and #current_column (both treated
# as 1-based when indexing into #lines).
def failure_character
  offset = @failing_rule_offset
  row = current_line(offset)
  col = current_column(offset)

  lines[row - 1][col - 1, 1]
end

#failure_info ⇒ Object



74
75
76
77
78
79
80
81
82
83
84
# File 'lib/weskit/wml/parsers/kpeg.rb', line 74

# Describes the recorded failure as "line L, column C: failed rule ...".
#
# When @failed_rule is a Symbol it is looked up in the class's Rules table and
# the message carries both the rule's name and its rendered form; any other
# value is interpolated as-is.
def failure_info
  row = current_line(@failing_rule_offset)
  col = current_column(@failing_rule_offset)

  unless @failed_rule.kind_of?(Symbol)
    return "line #{row}, column #{col}: failed rule '#{@failed_rule}'"
  end

  info = self.class::Rules[@failed_rule]
  "line #{row}, column #{col}: failed rule '#{info.name}' = '#{info.rendered}'"
end

#failure_oneline ⇒ Object



100
101
102
103
104
105
106
107
108
109
110
111
112
# File 'lib/weskit/wml/parsers/kpeg.rb', line 100

# Compact, single-line description of the recorded failure:
# "@L:C failed rule '<name>', got '<char>'".
#
# <name> is the Rules-table name when @failed_rule is a Symbol, otherwise
# @failed_rule itself; <char> is the input character at the failure position.
def failure_oneline
  row = current_line(@failing_rule_offset)
  col = current_column(@failing_rule_offset)
  got = lines[row - 1][col - 1, 1]

  rule_name =
    if @failed_rule.kind_of?(Symbol)
      self.class::Rules[@failed_rule].name
    else
      @failed_rule
    end

  "@#{row}:#{col} failed rule '#{rule_name}', got '#{got}'"
end

#get_byte ⇒ Object



172
173
174
175
176
177
178
179
180
# File 'lib/weskit/wml/parsers/kpeg.rb', line 172

# Consumes one byte of input: returns the byte at @pos as an Integer and
# advances @pos by one, or returns nil (leaving @pos alone) once @pos has
# reached @string.size.
#
# NOTE(review): the bound is measured with String#size (characters) while the
# read uses String#getbyte (bytes); the two differ for multibyte input —
# confirm which unit @pos is meant to be in.
def get_byte
  return nil unless @pos < @string.size

  byte = @string.getbyte(@pos)
  @pos += 1
  byte
end

#get_text(start) ⇒ Object



61
62
63
# File 'lib/weskit/wml/parsers/kpeg.rb', line 61

# Returns the slice of the input from offset +start+ up to, but not
# including, the current position @pos.
#
# start - offset into @string where the slice begins.
#
# An exclusive range is used on purpose: with an inclusive "start..@pos-1",
# a position of 0 turns the end into -1, which String#[] reads as "through
# the last character", so an empty match at the start of the input would
# return the whole string.
def get_text(start)
  @string[start...@pos]
end

#grow_lr(rule, args, start_pos, m) ⇒ Object



318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
# File 'lib/weskit/wml/parsers/kpeg.rb', line 318

# Repeatedly re-runs a left-recursive rule from +start_pos+ for as long as
# each run consumes more input than the memo entry +m+ currently records.
#
# rule      - name of the rule method.
# args      - arguments for the rule, or nil to call it without any.
# start_pos - position the rule is restarted from on every round.
# m         - memo entry holding the best outcome so far; updated with move!
#             after every round that advances further.
#
# Returns nil as soon as a round fails. Otherwise, once a round stops making
# progress, restores @result and @pos from +m+ and returns m.ans.
def grow_lr(rule, args, start_pos, m)
  while true
    @pos = start_pos
    @result = m.result

    attempt = args ? __send__(rule, *args) : __send__(rule)
    return nil unless attempt

    # No further progress than the recorded match: stop growing.
    break if @pos <= m.pos

    m.move!(attempt, @pos, @result)
  end

  @result = m.result
  @pos = m.pos
  m.ans
end

#lines ⇒ Object



53
54
55
56
57
# File 'lib/weskit/wml/parsers/kpeg.rb', line 53

# Returns the input as an Array of lines, in order, as yielded by
# string.each_line (so each line keeps its trailing newline, if any).
# The array is rebuilt on every call.
def lines
  string.each_line.to_a
end

#match_string(str) ⇒ Object



151
152
153
154
155
156
157
158
159
# File 'lib/weskit/wml/parsers/kpeg.rb', line 151

# Tries to match the literal +str+ at the current position.
#
# On a match, advances @pos by str.size and returns +str+; otherwise leaves
# @pos untouched and returns nil.
def match_string(str)
  width = str.size
  return nil unless @string[pos, width] == str

  @pos += width
  str
end

#parse(rule = nil) ⇒ Object



193
194
195
196
197
198
199
200
201
202
203
204
205
# File 'lib/weskit/wml/parsers/kpeg.rb', line 193

# Starts parsing at +rule+, or at the root rule when none is given.
#
# rule - optional rule name as a String; hyphens are rewritten to "_hyphen_"
#        and an underscore is prepended to obtain the rule method's name.
#
# Returns whatever #apply returns for the chosen rule.
def parse(rule=nil)
  # Rules are invoked through apply rather than called directly as methods:
  # if a rule uses left recursion, apply is what manages it.
  return apply(:_root) unless rule

  mangled = rule.gsub("-", "_hyphen_")
  apply(:"_#{mangled}")
end

#raise_error ⇒ Object

Raises: ParseError



117
118
119
# File 'lib/weskit/wml/parsers/kpeg.rb', line 117

# Raises ParseError, using the one-line summary from #failure_oneline as the
# exception message.
def raise_error
  raise ParseError, failure_oneline
end

#scan(reg) ⇒ Object



161
162
163
164
165
166
167
168
169
# File 'lib/weskit/wml/parsers/kpeg.rb', line 161

# Matches +reg+ against the remainder of the input (from @pos to the end).
#
# On a match, advances @pos by the offset at which the match ends within that
# remainder and returns true; otherwise returns nil and leaves @pos alone.
#
# NOTE(review): the advance is measured from the start of the remainder, not
# from where the match begins, so +reg+ is presumably expected to be anchored
# at the start — confirm against the patterns callers pass in.
def scan(reg)
  found = reg.match(@string[@pos..-1])
  return nil unless found

  @pos += found.end(0)
  true
end

#set_failed_rule(name) ⇒ Object



142
143
144
145
146
147
# File 'lib/weskit/wml/parsers/kpeg.rb', line 142

# Records +name+ as the failed rule, but only when the current position is
# strictly beyond the offset of the previously recorded failure — so the
# failure that got furthest into the input is the one that is kept.
#
# Returns the new @failing_rule_offset when the failure is recorded, nil
# otherwise.
def set_failed_rule(name)
  return unless @pos > @failing_rule_offset

  @failed_rule = name
  @failing_rule_offset = @pos
end

#setup_parser(str, debug = false) ⇒ Object

Prepares for parsing str. If you define a custom initialize, you must call this method before #parse.



16
17
18
19
20
21
22
23
24
25
# File 'lib/weskit/wml/parsers/kpeg.rb', line 16

# Resets all parser state so that +str+ can be parsed from the beginning.
# A custom #initialize must call this before #parse.
#
# str   - the input to parse.
# debug - accepted but not used by this method.
#
# Returns whatever setup_foreign_grammar returns.
def setup_parser(str, debug=false)
  @string = str
  @pos = 0
  @result = nil

  # No failure recorded yet: -1 sits below every real position, so the first
  # call to set_failed_rule always wins.
  @failed_rule = nil
  @failing_rule_offset = -1

  # Memo table: the first access for a key creates that key's own sub-table.
  @memoizations = Hash.new { |table, key| table[key] = {} }

  setup_foreign_grammar
end

#show_error(io = STDOUT) ⇒ Object



121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
# File 'lib/weskit/wml/parsers/kpeg.rb', line 121

# Writes a multi-line report of the recorded failure to +io+.
#
# io - destination responding to puts and print (defaults to STDOUT).
#
# The report holds, in order: the line and column of the failure, the rule
# that failed (with its rendered form when @failed_rule is a Symbol found in
# the class's Rules table), the inspected character at the failure offset,
# the offending input line prefixed with "=> ", and a caret line.
def show_error(io=STDOUT)
  offset = @failing_rule_offset
  row = current_line(offset)
  col = current_column(offset)

  io.puts "On line #{row}, column #{col}:"

  explanation =
    if @failed_rule.kind_of?(Symbol)
      info = self.class::Rules[@failed_rule]
      "Failed to match '#{info.rendered}' (rule '#{info.name}')"
    else
      "Failed to match rule '#{@failed_rule}'"
    end
  io.puts explanation

  io.puts "Got: #{string[offset,1].inspect}"
  io.puts "=> #{lines[row-1]}"

  # Caret line: the padding is the column plus 3.
  io.print(" " * (col + 3))
  io.puts "^"
end

#show_pos ⇒ Object



65
66
67
68
69
70
71
72
# File 'lib/weskit/wml/parsers/kpeg.rb', line 65

# Returns a short description of the current position: the offset followed by
# up to 10 characters of input on either side of it, formatted as
#   POS ("before" @ "after")
# The "before" part is prefixed with "... " once the position is at least 10
# characters into the input.
def show_pos
  span = 10
  ahead = @string[@pos, span]
  behind =
    if @pos < span
      @string[0, @pos]
    else
      "... #{@string[@pos - span, span]}"
    end

  "#{@pos} (\"#{behind}\" @ \"#{ahead}\")"
end