Class: Cosensee::LineParser

Inherits:
Object
  • Object
show all
Defined in:
lib/cosensee/line_parser.rb

Overview

Parses a single line.

Constant Summary collapse

# Captures leading tabs/spaces (group 1) and the remainder of the line (group 2).
INDENT_PATTERN =
/\A([\t ]*)(.*)\z/
# Captures a leading ">" mark (group 1) and the text that follows it (group 2).
QUOTE_PATTERN =
/\A(>)(.*)\z/
# Captures the "code:" prefix (group 1) and the non-empty text after it (group 2).
CODEBLOCK_PATTERN =
/\A(code:)(.+)\z/
# Captures a "$" or "%" prompt (group 1), then one space, then a non-empty command (group 2).
COMMANDLINE_PATTERN =
/\A([$%]) (.+)\z/

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize ⇒ LineParser

Returns a new instance of LineParser.



30
31
32
# File 'lib/cosensee/line_parser.rb', line 30

# Creates a parser holding its own Cosensee::BracketParser, which
# #parse_bracket uses to interpret the parts collected between "[" and "]".
def initialize
  @bracket_parser = Cosensee::BracketParser.new
end

Class Method Details

.merge_blocks(lines) ⇒ Object



17
18
19
20
21
22
23
24
25
26
27
28
# File 'lib/cosensee/line_parser.rb', line 17

# Folds continuation lines into the code-block line that precedes them.
#
# A line is treated as a continuation when the most recently kept line
# answers true to +codeblock?+ and has a smaller +indent_level+ than the
# current line. Continuations are not kept in the result; instead their raw
# text (minus the code block's indent width) is appended to the code-block
# line via +append_text+.
#
# @param lines [Enumerable] parsed lines responding to +codeblock?+,
#   +indent_level+, +raw+ and +append_text+
# @return [Array] the kept lines, in their original order
def self.merge_blocks(lines)
  kept = []

  lines.each do |line|
    # The last kept line is the only candidate owner of a continuation.
    owner = kept.last

    if owner&.codeblock? && owner.indent_level < line.indent_level
      # Strip as many leading characters as the owner's indent level.
      body = line.raw[owner.indent_level..]
      owner.append_text(text: body, raw_line: line.raw)
    else
      kept << line
    end
  end

  kept
end

.parse(line) ⇒ Object



13
14
15
# File 'lib/cosensee/line_parser.rb', line 13

# Convenience entry point: builds a fresh parser and parses +line+ with it.
#
# @param line the raw line, passed through to the instance-level #parse
# @return whatever the instance-level #parse returns
def self.parse(line)
  parser = new
  parser.parse(line)
end

Instance Method Details

#clean_elements(elements) ⇒ Object



252
253
254
255
256
257
258
259
260
261
262
263
264
# File 'lib/cosensee/line_parser.rb', line 252

# Normalizes a list of parsed elements.
#
# Drops +nil+ and empty-string entries, then joins each run of adjacent
# Strings into a single String. Non-String elements are kept unchanged and
# separate the String runs on either side of them.
#
# Blanks are discarded *before* merging: if they were only filtered at the
# end, a +nil+ sitting between two Strings would block the merge and leave
# two adjacent String fragments in the result.
#
# @param elements [Array] Strings, other element objects, and possibly nil
# @return [Array] a new array; +elements+ itself is not modified
def clean_elements(elements)
  elements.each_with_object([]) do |elem, cleaned|
    next if elem.nil? || elem == ''

    if cleaned.last.is_a?(String) && elem.is_a?(String)
      # Build a new String rather than appending in place, so Strings owned
      # by the caller are never mutated.
      cleaned[-1] = "#{cleaned.last}#{elem}"
    else
      cleaned << elem
    end
  end
end

#done_parsing(line) ⇒ Object



243
244
245
246
247
248
249
250
# File 'lib/cosensee/line_parser.rb', line 243

# Final pipeline step: marks the line as parsed.
#
# When the line's +line_content+ is a Cosensee::Node::Quote, the inline
# content gathered so far is first moved into the quote (via
# +replace_content+) and the line's own +content+ is reset to an empty array.
#
# @param line the line being parsed
# @return the result of +line.update(parsed: true)+
def done_parsing(line)
  whole = line.line_content
  return line.update(parsed: true) unless whole.is_a?(Cosensee::Node::Quote)

  filled_quote = whole.replace_content(line.content)
  line.update(line_content: filled_quote, content: [])
  line.update(parsed: true)
end

#parse(line) ⇒ Object



34
35
36
37
38
39
40
41
42
43
44
45
# File 'lib/cosensee/line_parser.rb', line 34

# Runs the full parsing pipeline over one raw line.
#
# The line is wrapped in a ParsedLine (used both as +rest+ and +raw+) and
# handed through each stage in a fixed order: indent, whole-line constructs,
# inline code, double brackets, single brackets, URLs, hashtags, and finally
# #done_parsing. Each stage receives the previous stage's return value.
#
# @param line the raw line
# @return the value returned by #done_parsing
def parse(line)
  current = ParsedLine.new(rest: line, raw: line)

  current = parse_indent(current)
  current = parse_whole_line(current)
  current = parse_code(current)
  current = parse_double_bracket(current)
  current = parse_bracket(current)
  current = parse_url(current)
  current = parse_hashtag(current)

  done_parsing(current)
end

#parse_bracket(line) ⇒ Object



192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
# File 'lib/cosensee/line_parser.rb', line 192

# Resolves single-bracket spans ("[...]") in the line's content.
#
# String elements are scanned for "[" and then the next "]". Everything
# collected in between -- String pieces as well as Code / DoubleBracket
# nodes, possibly spread over several elements -- is passed as an array to
# @bracket_parser.parse, and the result takes the span's place. Text outside
# brackets is kept as-is. If a "[" is never closed, a literal "[" followed by
# the collected pieces is put back into the output.
#
# @param line the line being parsed; returned untouched when already parsed
# @return the result of +line.update+ with the cleaned element list
def parse_bracket(line)
  return line if line.parsed?

  finished = []
  # nil while outside a bracket; an Array of collected parts while inside one.
  open_parts = nil

  line.content.each do |elem|
    case elem
    when Cosensee::Node::Code, Cosensee::Node::DoubleBracket
      # Nodes never open or close a bracket; they go wherever text would go.
      (open_parts || finished) << elem
    else # elem is String
      remaining = elem
      loop do
        delimiter = open_parts ? ']' : '['
        pos = remaining.index(delimiter)

        unless pos
          (open_parts || finished) << remaining
          break
        end

        head = remaining[0, pos]
        if open_parts
          # Closing bracket: hand the collected parts to the bracket parser.
          open_parts << head
          finished << @bracket_parser.parse(open_parts)
          open_parts = nil
        else
          # Opening bracket: start collecting.
          finished << head
          open_parts = []
        end
        remaining = remaining[(pos + 1)..]
      end
    end
  end

  # Unclosed bracket: restore the "[" and everything collected after it.
  finished.push('[', *open_parts) if open_parts

  line.update(content: clean_elements(finished))
end

#parse_code(line) ⇒ Object



83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
# File 'lib/cosensee/line_parser.rb', line 83

# Splits the unparsed rest of the line on backticks into plain text and
# inline-code nodes.
#
# The segments returned by +line.split_rest_by('`')+ are consumed in
# text/code pairs. A code candidate only becomes a Node::Code when at least
# one more segment follows it; a candidate that is the very last segment is
# glued back onto the preceding text together with its opening backtick.
# In every case the line's +rest+ is set to nil and +content+ to the
# collected elements.
#
# @param line the line being parsed; returned untouched when already parsed
# @return the line (or the result of +line.update+)
def parse_code(line)
  return line if line.parsed?

  elements = []
  segments = line.split_rest_by('`')

  loop do
    return line.update(rest: nil, content: elements) if segments.empty?

    text = segments.shift
    elements << text

    if segments.empty?
      line.update(rest: nil, content: elements)
      return line
    end

    candidate = segments.shift

    if segments.empty?
      # No segment after the candidate: restore the backtick as literal text
      # by appending to the text segment in place.
      text << "`#{candidate}"
      return line.update(rest: nil, content: elements)
    end

    elements << Node::Code.new(candidate, "`#{candidate}`")
  end
end

#parse_double_bracket(line) ⇒ Object



166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
# File 'lib/cosensee/line_parser.rb', line 166

# Replaces every "[[...]]" span found in String elements with a
# Cosensee::Node::DoubleBracket node.
#
# The bracket body is matched non-greedily and must contain at least one
# character. Non-String elements are passed through unchanged.
#
# @param line the line being parsed; returned untouched when already parsed
# @return the result of +line.update+ with the cleaned element list
def parse_double_bracket(line)
  return line if line.parsed?

  pieces = []

  line.content.each do |elem|
    unless elem.is_a?(String)
      pieces << elem
      next
    end

    remaining = elem
    while (found = remaining.match(/\[\[(.+?)\]\]/))
      pieces << found.pre_match
      pieces << Cosensee::Node::DoubleBracket.new(content: [found[1]], raw: found[0])
      remaining = found.post_match
    end
    # Whatever is left after the last match is plain text.
    pieces << remaining
  end

  line.update(content: clean_elements(pieces))
end

#parse_hashtag(line) ⇒ Object



114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
# File 'lib/cosensee/line_parser.rb', line 114

# Replaces hashtags in String elements with Cosensee::Node::HashTag nodes.
#
# A hashtag is a "#" at the start of a line or right after a whitespace
# character, followed by one or more non-whitespace characters. The
# whitespace in front of the "#" stays with the preceding text. Non-String
# elements are passed through unchanged.
#
# @param line the line being parsed; returned untouched when already parsed
# @return the result of +line.update+ with the cleaned element list
def parse_hashtag(line)
  return line if line.parsed?

  pieces = []

  line.content.each do |elem|
    unless elem.is_a?(String)
      pieces << elem
      next
    end

    remaining = elem
    while (found = remaining.match(/(^|\s)#(\S+)/))
      tag = found[2]
      pieces << "#{found.pre_match}#{found[1]}"
      pieces << Cosensee::Node::HashTag.new(content: tag, raw: "##{tag}")
      remaining = found.post_match
    end
    # Whatever is left after the last match is plain text.
    pieces << remaining
  end

  line.update(content: clean_elements(pieces))
end

#parse_indent(line) ⇒ Object



47
48
49
50
51
# File 'lib/cosensee/line_parser.rb', line 47

# Separates the leading tabs/spaces from the rest of the line.
#
# Builds a brand-new ParsedLine whose +indent+ is a Cosensee::Node::Indent
# created from the leading whitespace, whose +rest+ is everything after it,
# and whose +raw+ is carried over from +line+.
#
# @param line an object responding to +match+ and +raw+
# @return [ParsedLine] a new parsed line
def parse_indent(line)
  matched = line.match(INDENT_PATTERN)
  indent_node = Cosensee::Node::Indent.new(matched[1], matched[1])

  ParsedLine.new(indent: indent_node, rest: matched[2], raw: line.raw)
end

#parse_url(line) ⇒ Object



140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
# File 'lib/cosensee/line_parser.rb', line 140

# Replaces bare http/https URLs in String elements with
# Cosensee::Node::Link nodes.
#
# A URL starts at "http://" or "https://" and runs up to the next whitespace
# character. The text in front of each URL is kept as a String. Non-String
# elements are passed through unchanged.
#
# @param line the line being parsed; returned untouched when already parsed
# @return the result of +line.update+ with the cleaned element list
def parse_url(line)
  return line if line.parsed?

  pieces = []

  line.content.each do |elem|
    unless elem.is_a?(String)
      pieces << elem
      next
    end

    remaining = elem
    while (found = remaining.match(%r{(^|.*?)(https?://[^\s]+)}))
      # Group 1 holds the text between the match start and the URL.
      pieces << "#{found.pre_match}#{found[1]}"
      pieces << Cosensee::Node::Link.new(found[2], found[2])
      remaining = found.post_match
    end
    # Whatever is left after the last match is plain text.
    pieces << remaining
  end

  line.update(content: clean_elements(pieces))
end

#parse_whole_line(line) ⇒ Object



53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# File 'lib/cosensee/line_parser.rb', line 53

# Recognizes constructs that are decided by how the line starts. They are
# tried in this order; the first match wins:
#
# 1. Quote (QUOTE_PATTERN): stores a Quote node with nil content and leaves
#    the text after the mark in +rest+ for the later inline stages.
# 2. Code block header (CODEBLOCK_PATTERN): stores a Codeblock node with
#    empty content and marks the line as parsed.
# 3. Command line (COMMANDLINE_PATTERN): stores a CommandLine node and marks
#    the line as parsed.
#
# A line matching none of them is returned unchanged.
#
# @param line the line being parsed
# @return the line itself, or the result of +line.update+ for code blocks
#   and command lines
def parse_whole_line(line)
  if (quote = line.match(QUOTE_PATTERN))
    quote_node = Cosensee::Node::Quote.new(content: nil, raw: quote[0], mark: quote[1])
    line.update(rest: quote[2], line_content: quote_node)
    line
  elsif (codeblock = line.match(CODEBLOCK_PATTERN))
    block_node = Cosensee::Node::Codeblock.new(content: '', name: codeblock[2], raw: codeblock[0])
    line.update(rest: nil, line_content: block_node, parsed: true)
  elsif (command = line.match(COMMANDLINE_PATTERN))
    command_node = Cosensee::Node::CommandLine.new(content: command[2],
                                                   prompt: command[1],
                                                   raw: command[0])
    line.update(rest: nil, line_content: command_node, parsed: true)
  else
    line
  end
end