Class: Brief::Document::ContentExtractor

Inherits:
Object
  • Object
show all
Defined in:
lib/brief/document/content_extractor.rb

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(model_type, document) ⇒ ContentExtractor

Returns a new instance of ContentExtractor.



3
4
5
6
# File 'lib/brief/document/content_extractor.rb', line 3

def initialize(model_type, document)
  @model_type = model_type
  @document = document
end

Dynamic Method Handling

This class handles dynamic methods through the method_missing method

#method_missing(meth, *_args, &_block) ⇒ Object



31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# File 'lib/brief/document/content_extractor.rb', line 31

def method_missing(meth, *_args, &_block)
  if settings = content_schema_attributes.fetch(meth, nil)
    if settings.args.length == 1 && settings.args.first.is_a?(String)
      selector = settings.args.first
      matches = document.css(selector)

      if matches.length > 1
        selector.match(/first-of-type/) ? matches.first.text : matches.map(&:text)
      else
        matches.first.try(:text)
      end
    elsif settings.args.first.to_s.match(/code/i) && (settings.args.last.serialize rescue nil)
      selector = settings.args.first
      opts = settings.args.last

      matches = document.css(selector)

      val = if matches.length > 1
        selector.match(/first-of-type/) ? matches.first.text : matches.map(&:text)
      else
        matches.first.try(:text)
      end

      if val && opts.serialize == :yaml
        return (YAML.load(val) rescue {}).to_mash
      end

      if val && opts.serialize == :json
        return (JSON.parse(val) rescue {}).to_mash
      end
    end
  end
end

Instance Attribute Details

#documentObject (readonly)

Returns the value of attribute document.



8
9
10
# File 'lib/brief/document/content_extractor.rb', line 8

def document
  @document
end

Instance Method Details

#content_schema_attributesObject



14
15
16
# File 'lib/brief/document/content_extractor.rb', line 14

def content_schema_attributes
  model_class.definition.content_schema.attributes
end

#extracted_content_dataObject



18
19
20
21
22
23
24
25
# File 'lib/brief/document/content_extractor.rb', line 18

def extracted_content_data
  me = self
  content_schema_attributes.keys.reduce({}.to_mash) do |memo, attr|
    val = me.send(attr) rescue nil
    memo[attr] = val if val
    memo
  end
end

#model_classObject



10
11
12
# File 'lib/brief/document/content_extractor.rb', line 10

def model_class
  document.model_class
end

#respond_to?(meth) ⇒ Boolean

Returns:

  • (Boolean)


27
28
29
# File 'lib/brief/document/content_extractor.rb', line 27

def respond_to?(meth)
  content_schema_attributes.key?(meth) || super
end