Class: Gollum::Sanitization

Inherits:
Object
  • Object
show all
Defined in:
lib/gollum-lib/sanitization.rb

Overview

Encapsulate sanitization options.

This class does not yet support all options of the Sanitize library. See github.com/rgrove/sanitize/.

Constant Summary collapse

ELEMENTS =

Default whitelisted elements.

[
    'a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
    'blockquote', 'br', 'button', 'caption', 'center', 'cite',
    'code', 'col', 'colgroup', 'dd', 'del', 'dfn', 'dir',
    'div', 'dl', 'dt', 'em', 'fieldset', 'font', 'form', 'h1',
    'h2', 'h3', 'h4', 'h5', 'h6', 'hr', 'i', 'img', 'input',
    'ins', 'kbd', 'label', 'legend', 'li', 'map', 'mark', 'menu',
    'ol', 'optgroup', 'option', 'p', 'pre', 'q', 's', 'samp',
    'select', 'small', 'span', 'strike', 'strong', 'sub',
    'sup', 'table', 'tbody', 'td', 'textarea', 'tfoot', 'th',
    'thead', 'tr', 'tt', 'u', 'ul', 'var'
].freeze
ATTRIBUTES =

Default whitelisted attributes.

{
    'a'   => ['href'],
    'img' => ['src'],
    :all  => ['abbr', 'accept', 'accept-charset',
              'accesskey', 'action', 'align', 'alt', 'axis',
              'border', 'cellpadding', 'cellspacing', 'char',
              'charoff', 'class', 'charset', 'checked', 'cite',
              'clear', 'cols', 'colspan', 'color',
              'compact', 'coords', 'datetime', 'dir',
              'disabled', 'enctype', 'for', 'frame',
              'headers', 'height', 'hreflang',
              'hspace', 'id', 'ismap', 'label', 'lang',
              'longdesc', 'maxlength', 'media', 'method',
              'multiple', 'name', 'nohref', 'noshade',
              'nowrap', 'prompt', 'readonly', 'rel', 'rev',
              'rows', 'rowspan', 'rules', 'scope',
              'selected', 'shape', 'size', 'span',
              'start', 'summary', 'tabindex', 'target',
              'title', 'type', 'usemap', 'valign', 'value',
              'vspace', 'width']
}.freeze
PROTOCOLS =

Default whitelisted protocols for URLs.

{
    'a'    => { 'href' => ['http', 'https', 'mailto', 'ftp', 'irc', 'apt', :relative] },
    'img'  => { 'src' => ['http', 'https', :relative] },
    'form' => { 'action' => ['http', 'https', :relative] }
}.freeze
# Copies the configured extra attributes onto a node. The attribute map is
# looked up under env[:config][:add_attributes] by the node's element name;
# nodes without an entry are left untouched and the lambda returns nil.
ADD_ATTRIBUTES = lambda do |env, node|
  extras = env[:config][:add_attributes][node.name]
  extras.each { |attr, val| node[attr] = val } if extras
end
REMOVE_CONTENTS =

Default elements whose contents will be removed in addition to the elements themselves.

[
    'script',
    'style'
].freeze
TRANSFORMERS =

Default transformers that force the configured id_prefix (for example ‘wiki-’) onto id and name attributes and onto fragment (#…) href values.

lambda do |env|
      node = env[:node]
      return if env[:is_whitelisted] || !node.element?
      prefix      = env[:config][:id_prefix]
      found_attrs = %w(id name).select do |key|
        if (value = node[key])
          node[key] = value.gsub(/\A(#{prefix})?/, prefix)
        end
      end
      if found_attrs.size > 0
        ADD_ATTRIBUTES.call(env, node)
        {}
      end
    end,
    lambda do |env|
      node = env[:node]
      return unless (value = node['href'])
      prefix       = env[:config][:id_prefix]
      node['href'] = value.gsub(/\A\#(#{prefix})?/, '#'+prefix)
      ADD_ATTRIBUTES.call(env, node)
      {}
    end
].freeze

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize {|_self| ... } ⇒ Sanitization

Returns a new instance of Sanitization.

Yields:

  • (_self)

Yield Parameters:



124
125
126
127
128
129
130
131
132
133
134
# File 'lib/gollum-lib/sanitization.rb', line 124

# Builds a Sanitization seeded with the default whitelists, then yields the
# new instance to the optional block so the caller can adjust it.
#
# NOTE(review): #dup is shallow, so the arrays and hashes nested inside
# ATTRIBUTES and PROTOCOLS are still shared with the constants; mutating
# them in place through one instance would be visible to every other one.
def initialize
  # Plain settings and the (initially empty) add_attributes map.
  @id_prefix      = ''
  @allow_comments = false
  @add_attributes = {}

  # Top-level copies of the frozen defaults.
  @remove_contents = REMOVE_CONTENTS.dup
  @transformers    = TRANSFORMERS.dup
  @protocols       = PROTOCOLS.dup
  @attributes      = ATTRIBUTES.dup
  @elements        = ELEMENTS.dup

  yield(self) if block_given?
end

Instance Attribute Details

#add_attributesObject (readonly)

Gets a Hash describing HTML attributes that Sanitize should add. Default: {}



114
115
116
# File 'lib/gollum-lib/sanitization.rb', line 114

# Returns the Hash of attributes to add, keyed by element name
# (e.g. 'a' => { 'rel' => 'nofollow' }). Starts out as {} in initialize.
def add_attributes
  @add_attributes
end

#allow_comments=(value) ⇒ Object (writeonly)

Sets a boolean determining whether Sanitize allows HTML comments in the output. Default: false.



122
123
124
# File 'lib/gollum-lib/sanitization.rb', line 122

# Stores the flag that allow_comments? reports. Any object is accepted;
# allow_comments? coerces it to true or false when it is read back.
def allow_comments=(value)
  @allow_comments = value
end

#attributesObject (readonly)

Gets a Hash describing which attributes are allowed in which HTML elements. Default: ATTRIBUTES.



98
99
100
# File 'lib/gollum-lib/sanitization.rb', line 98

# Returns the Hash of whitelisted attributes for this instance
# (initialized from a copy of ATTRIBUTES).
def attributes
  @attributes
end

#elementsObject (readonly)

Gets an Array of whitelisted HTML elements. Default: ELEMENTS.



94
95
96
# File 'lib/gollum-lib/sanitization.rb', line 94

# Returns the Array of whitelisted element names for this instance
# (initialized from a copy of ELEMENTS).
def elements
  @elements
end

#id_prefixObject

Gets or sets a String prefix which is added to ID attributes. Default: ''



110
111
112
# File 'lib/gollum-lib/sanitization.rb', line 110

# Returns the String prefix that the default transformers put in front of
# id/name attribute values and fragment hrefs. Starts out as '' in initialize.
def id_prefix
  @id_prefix
end

#protocolsObject (readonly)

Gets a Hash describing which URI protocols are allowed in HTML attributes. Default: PROTOCOLS



102
103
104
# File 'lib/gollum-lib/sanitization.rb', line 102

# Returns the Hash of allowed URL protocols, nested as
# element name => attribute name => list of protocols
# (initialized from a copy of PROTOCOLS).
def protocols
  @protocols
end

#remove_contentsObject (readonly)

Gets an Array of element names whose contents will be removed in addition to the elements themselves. Default: REMOVE_CONTENTS



118
119
120
# File 'lib/gollum-lib/sanitization.rb', line 118

# Returns the Array of element names whose contents are removed along with
# the elements themselves (initialized from a copy of REMOVE_CONTENTS).
def remove_contents
  @remove_contents
end

#transformersObject (readonly)

Gets an Array of transformer lambdas that are passed to Sanitize. Default: TRANSFORMERS



106
107
108
# File 'lib/gollum-lib/sanitization.rb', line 106

# Returns the Array of transformer lambdas for this instance
# (initialized from a copy of TRANSFORMERS).
def transformers
  @transformers
end

Instance Method Details

#allow_comments?Boolean

Determines if Sanitize should allow HTML comments.

Returns True if comments are allowed, or False.

Returns:

  • (Boolean)


139
140
141
# File 'lib/gollum-lib/sanitization.rb', line 139

# Reports whether HTML comments are allowed, always as a strict true/false
# regardless of what object was stored through allow_comments=.
def allow_comments?
  @allow_comments ? true : false
end

#history_sanitizationObject

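Builds a new Sanitization instance, based on the defaults, that is configured to sanitize older revisions of pages (links additionally get rel="nofollow"). The current instance is not modified.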

Returns a Sanitization instance.



147
148
149
150
151
# File 'lib/gollum-lib/sanitization.rb', line 147

# Returns a brand-new instance of the receiver's class whose add_attributes
# map tags every 'a' element with rel="nofollow". The receiver itself is not
# touched, and its own customizations are not carried over to the new object.
def history_sanitization
  nofollow = { 'rel' => 'nofollow' }
  self.class.new { |fresh| fresh.add_attributes['a'] = nofollow }
end

#to_hashObject

Builds a Hash of options suitable for Sanitize.clean.

Returns a Hash.



156
157
158
159
160
161
162
163
164
165
166
# File 'lib/gollum-lib/sanitization.rb', line 156

# Collects the current settings into a single options Hash (the form that
# to_sanitize hands to Sanitize.new). :allow_comments goes through
# allow_comments?, so that entry is always a strict true/false.
def to_hash
  options = {}
  options[:elements]        = elements
  options[:attributes]      = attributes
  options[:protocols]       = protocols
  options[:add_attributes]  = add_attributes
  options[:remove_contents] = remove_contents
  options[:allow_comments]  = allow_comments?
  options[:transformers]    = transformers
  options[:id_prefix]       = id_prefix
  options
end

#to_sanitizeObject

Builds a Sanitize instance from the current options.

Returns a Sanitize instance.



171
172
173
# File 'lib/gollum-lib/sanitization.rb', line 171

# Creates a Sanitize object configured with this instance's current options.
def to_sanitize
  options = to_hash
  Sanitize.new(options)
end