Class: Fdlint::Parser::HTML::HtmlParser

Inherits:

BaseParser

Object
BaseParser
Fdlint::Parser::HTML::HtmlParser

show all

Includes: Helper::Logger, ParserVisitable

Defined in: lib/fdlint/parser/html/html_parser.rb

Constant Summary collapse

TEXT =

/[^<]+/m

PROP_NAME =

%r/\w[-:\w]*/m

PROP_VALUE =

%r/'([^']*)'|"([^"]*)"|([^\s>]+)/m

PROP =

%r/#{PROP_NAME}\s*(?:=\s*#{PROP_VALUE})?/m

TAG_NAME =

/\w[^>\(\)\/\s]*/

TAG_START =

%r/<(#{TAG_NAME})/m

TAG_END =

%r/<\/#{TAG_NAME}\s*>/m

TAG =

%r/#{TAG_START}(\s+#{PROP})*\s*>/m

SELF_CLOSE_TAG =

%r/#{TAG_START}(\s+#{PROP})*\s*\/>/m

DTD =

/\s*<!(doctype)\s+(.*?)>/im

COMMENT =

/<!--(.*?)-->/m

Constants included from Helper::Logger

Helper::Logger::LEVELS

Instance Attribute Summary

Attributes inherited from BaseParser

#source

Class Method Summary collapse

.parse(src) {|doc| ... } ⇒ Object

Instance Method Summary collapse

Constructor Details

This class inherits a constructor from Fdlint::Parser::BaseParser

Class Method Details

.parse(src) {|doc| ... } ⇒ `Object`

Yields:

(doc)

# File 'lib/fdlint/parser/html/html_parser.rb', line 13

# Convenience entry point: builds a parser for +src+, runs the
# instance-level #parse and hands back the resulting document.
#
# @param src the source passed straight to the constructor
# @yield [doc] the parsed document, only when a block is supplied
# @return the document returned by the instance-level #parse
def self.parse(src, &block)
  new(src).parse.tap do |doc|
    yield doc if block_given?
  end
end

Instance Method Details

#parse ⇒ `Object`



32
33
34

# File 'lib/fdlint/parser/html/html_parser.rb', line 32

# Parses the source held by this parser by delegating to #parse_doc.
#
# @return whatever #parse_doc returns
def parse
  parse_doc
end

#parse_comment ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 63

# Consumes an HTML comment (COMMENT) and wraps its inner text, i.e. the
# first capture group of COMMENT, in a CommentElement.
#
# @return [CommentElement]
def parse_comment
  scan(COMMENT)
  comment_body = @scanner[1]
  CommentElement.new(comment_body)
end

#parse_doc ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 36

# Builds the Document for the whole source.
#
# The children come from batch(:parse_element); presumably that helper
# keeps invoking #parse_element and collects the results (confirm against
# BaseParser).
#
# @return [::Fdlint::Parser::HTML::Document]
def parse_doc
  debug { "parse doc" }
  elements = batch(:parse_element)
  ::Fdlint::Parser::HTML::Document.new(elements)
end

#parse_dtd ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 57

# Consumes a doctype declaration (DTD) and turns it into a DTDElement.
#
# The element receives, in order: the second capture of DTD (the text
# after the keyword), the first capture (the "doctype" keyword as it was
# written) and the position reported by the value that `scan` returned.
#
# @return [DTDElement]
def parse_dtd
  debug { "parse dtd" }
  scanned = scan(DTD)
  keyword     = @scanner[1]
  declaration = @scanner[2]
  DTDElement.new(declaration, keyword, scanned.position)
end

#parse_element ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 41

# Parses the next top-level construct at the scanner position.
#
# Candidates are tried in this order: doctype (accepted only once per
# document), comment, tag, and finally plain text. If none applies and the
# text has ended, a parse error is reported.
#
# @return the result of the selected parse_* method, or of parse_error
def parse_element
  if @scanner.check(DTD) && !@dtd_checked
    # only one DTD for one document
    @dtd_checked = true
    return parse_dtd
  end

  return parse_comment if @scanner.check(COMMENT)
  return parse_tag if @scanner.check(TAG_START)
  return parse_text_tag unless text_end?

  parse_error('Invalid HTML struct')
end

#parse_prop_name ⇒ `Object`



117
118
119

# File 'lib/fdlint/parser/html/html_parser.rb', line 117

# Consumes an attribute name (PROP_NAME) at the current position.
#
# @return the result of the `scan` helper for PROP_NAME
def parse_prop_name
  scan PROP_NAME
end

#parse_prop_value ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 121

# Consumes an attribute value (PROP_VALUE) and returns it without quotes.
#
# PROP_VALUE has three alternatives (single-quoted, double-quoted and
# unquoted), each with its own capture group. The captures that did not
# take part are nil and interpolate as empty strings, so concatenating all
# three yields the value itself.
#
# @return [String] the attribute value with surrounding quotes removed
def parse_prop_value
  scan(PROP_VALUE)
  single_quoted, double_quoted, unquoted = @scanner[1], @scanner[2], @scanner[3]
  "#{single_quoted}#{double_quoted}#{unquoted}"
end

#parse_properties ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 96

# Collects the properties of a tag until prop_search_done? reports true.
#
# skip_empty is called once up front and again after every property.
# Falsy results from #parse_property are dropped.
#
# @return [Array] the parsed properties, in source order
def parse_properties
  collected = []
  skip_empty
  until prop_search_done?
    property = parse_property
    collected.push(property) if property
    skip_empty
  end
  collected
end

#parse_property ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 107

# Parses a single property: a name, optionally followed by "=" and a value.
#
# When a value is present, the quote character that opens it (' or ") is
# recorded as the separator; it is nil for unquoted values. A property
# without "=" gets nil for both value and separator.
#
# @return [Property] built from name, value and separator, in that order
def parse_property
  prop_name  = parse_prop_name
  prop_value = nil
  quote      = nil

  if @scanner.check(/\s*=/)
    skip(/[=]/)
    quote      = @scanner.check(/['"]/)
    prop_value = parse_prop_value
  end

  Property.new(prop_name, prop_value, quote)
end

#parse_tag ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 84

# Dispatches to the tag parser that matches the input at the scanner
# position: doctype, self-closing tag, then normal opening tag. Reports a
# parse error when none of the patterns match.
#
# NOTE(review): parse_dtd_tag is not among the methods visible in this
# listing (only parse_dtd is) -- confirm it is defined elsewhere.
#
# @return the result of the selected parser, or of parse_error
def parse_tag
  return parse_dtd_tag if @scanner.check(DTD)
  return parse_self_ending_tag if @scanner.check(SELF_CLOSE_TAG)
  return parse_normal_tag if @scanner.check(TAG)

  parse_error('Invalid HTML struct')
end

#parse_text_tag ⇒ `Object`

# File 'lib/fdlint/parser/html/html_parser.rb', line 68

# Reads a run of character data and wraps it in a TextElement.
#
# Text is accumulated until text_end? reports true. A "<" sitting at the
# scanner position inside the run is kept as literal text. After each chunk
# a warning is raised if the accumulated text contains "<" or ">", unless
# @parsing_script is set.
#
# @return [TextElement] with scopes (a dup of the current scopes) and the
#   position captured before scanning started
def parse_text_tag
  buffer    = ''
  start_pos = scanner_pos

  until text_end?
    buffer << '<' if @scanner.skip(/</)
    buffer << @scanner.scan(TEXT).to_s

    # TODO: make this detection a rule
    if buffer =~ /<|>/ && !@parsing_script
      parse_warn "'#{Regexp.last_match}' not escaped"
    end
  end

  element = TextElement.new(buffer)
  element.scopes   = scopes.dup
  element.position = start_pos
  element
end

Class: Fdlint::Parser::HTML::HtmlParser

Constant Summary collapse

Constants included from Helper::Logger

Instance Attribute Summary

Attributes inherited from BaseParser

Class Method Summary collapse

Instance Method Summary collapse

Methods included from Helper::Logger

Methods included from ParserVisitable

Methods inherited from BaseParser

Constructor Details

Class Method Details

.parse(src) {|doc| ... } ⇒ Object

Instance Method Details

#parse ⇒ Object

#parse_comment ⇒ Object

#parse_doc ⇒ Object

#parse_dtd ⇒ Object

#parse_element ⇒ Object

#parse_prop_name ⇒ Object

#parse_prop_value ⇒ Object

#parse_properties ⇒ Object

#parse_property ⇒ Object

#parse_tag ⇒ Object

#parse_text_tag ⇒ Object