Class: Nokogiri::CSS::Parser

Inherits:
Racc::Parser
  • Object
show all
Defined in:
lib/nokogiri/css/parser.rb,
lib/nokogiri/css/parser_extras.rb

Constant Summary collapse

Racc_arg =
[
racc_action_table,
racc_action_check,
racc_action_default,
racc_action_pointer,
racc_goto_table,
racc_goto_check,
racc_goto_default,
racc_goto_pointer,
racc_nt_base,
racc_reduce_table,
racc_token_table,
racc_shift_n,
racc_reduce_n,
racc_use_result_var ]
Racc_token_to_s_table =
[
"$end",
"error",
"FUNCTION",
"INCLUDES",
"DASHMATCH",
"LBRACE",
"HASH",
"PLUS",
"GREATER",
"S",
"STRING",
"IDENT",
"COMMA",
"NUMBER",
"PREFIXMATCH",
"SUFFIXMATCH",
"SUBSTRINGMATCH",
"TILDE",
"NOT_EQUAL",
"SLASH",
"DOUBLESLASH",
"NOT",
"EQUAL",
"RPAREN",
"LSQUARE",
"RSQUARE",
"HAS",
"\".\"",
"\"*\"",
"\"|\"",
"\":\"",
"$start",
"selector",
"simple_selector_1toN",
"prefixless_combinator_selector",
"optional_S",
"combinator",
"simple_selector",
"element_name",
"hcap_0toN",
"function",
"pseudo",
"attrib",
"hcap_1toN",
"class",
"namespaced_ident",
"namespace",
"attrib_name",
"attrib_val_0or1",
"expr",
"nth",
"attribute_id",
"negation",
"eql_incl_dash",
"negation_arg" ]
Racc_debug_parser =
false

Class Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(namespaces = {}) ⇒ Parser

Create a new CSS parser with respect to namespaces


54
55
56
57
58
# File 'lib/nokogiri/css/parser_extras.rb', line 54

def initialize namespaces = {}
  @tokenizer  = Tokenizer.new
  @namespaces = namespaces
  super()
end

Class Attribute Details

.cache_onObject Also known as: cache_on?

Turn on CSS parse caching


12
13
14
# File 'lib/nokogiri/css/parser_extras.rb', line 12

def cache_on
  @cache_on
end

Class Method Details

.[](string) ⇒ Object

Get the css selector in string from the cache


17
18
19
20
# File 'lib/nokogiri/css/parser_extras.rb', line 17

def [] string
  return unless @cache_on
  @mutex.synchronize { @cache[string] }
end

.[]=(string, value) ⇒ Object

Set the css selector in string in the cache to value


23
24
25
26
# File 'lib/nokogiri/css/parser_extras.rb', line 23

def []= string, value
  return value unless @cache_on
  @mutex.synchronize { @cache[string] = value }
end

.clear_cacheObject

Clear the cache


29
30
31
# File 'lib/nokogiri/css/parser_extras.rb', line 29

def clear_cache
  @mutex.synchronize { @cache = {} }
end

.parse(selector) ⇒ Object

Parse this CSS selector in selector. Returns an AST.


43
44
45
46
47
48
49
50
# File 'lib/nokogiri/css/parser_extras.rb', line 43

def parse selector
  @warned ||= false
  unless @warned
    $stderr.puts('Nokogiri::CSS::Parser.parse is deprecated, call Nokogiri::CSS.parse(), this will be removed August 1st or version 1.4.0 (whichever is first)')
    @warned = true
  end
  new.parse selector
end

.without_cache(&block) ⇒ Object

Execute block without cache


34
35
36
37
38
39
# File 'lib/nokogiri/css/parser_extras.rb', line 34

def without_cache &block
  tmp = @cache_on
  @cache_on = false
  block.call
  @cache_on = tmp
end

Instance Method Details

#_reduce_1(val, _values, result) ⇒ Object

reduce 0 omitted


334
335
336
337
338
# File 'lib/nokogiri/css/parser.rb', line 334

def _reduce_1(val, _values, result)
        result = [val.first, val.last].flatten
      
    result
end

#_reduce_11(val, _values, result) ⇒ Object

reduce 10 omitted


387
388
389
390
391
# File 'lib/nokogiri/css/parser.rb', line 387

def _reduce_11(val, _values, result)
        result = Node.new(:CONDITIONAL_SELECTOR, val)
      
    result
end

#_reduce_12(val, _values, result) ⇒ Object


393
394
395
396
397
# File 'lib/nokogiri/css/parser.rb', line 393

def _reduce_12(val, _values, result)
        result = Node.new(:CONDITIONAL_SELECTOR, val)
      
    result
end

#_reduce_13(val, _values, result) ⇒ Object


399
400
401
402
403
404
405
# File 'lib/nokogiri/css/parser.rb', line 399

def _reduce_13(val, _values, result)
        result = Node.new(:CONDITIONAL_SELECTOR,
          [Node.new(:ELEMENT_NAME, ['*']), val.first]
        )
      
    result
end

#_reduce_14(val, _values, result) ⇒ Object


407
408
409
410
411
# File 'lib/nokogiri/css/parser.rb', line 407

def _reduce_14(val, _values, result)
        result = Node.new(val.first, [nil, val.last])
      
    result
end

#_reduce_15(val, _values, result) ⇒ Object


413
414
415
416
417
# File 'lib/nokogiri/css/parser.rb', line 413

def _reduce_15(val, _values, result)
        result = Node.new(val[1], [val.first, val.last])
      
    result
end

#_reduce_16(val, _values, result) ⇒ Object


419
420
421
422
423
# File 'lib/nokogiri/css/parser.rb', line 419

def _reduce_16(val, _values, result)
        result = Node.new(:DESCENDANT_SELECTOR, [val.first, val.last])
      
    result
end

#_reduce_18(val, _values, result) ⇒ Object

reduce 17 omitted


427
428
429
430
# File 'lib/nokogiri/css/parser.rb', line 427

def _reduce_18(val, _values, result)
 result = Node.new(:CLASS_CONDITION, [unescape_css_identifier(val[1])]) 
    result
end

#_reduce_2(val, _values, result) ⇒ Object


340
341
342
343
# File 'lib/nokogiri/css/parser.rb', line 340

def _reduce_2(val, _values, result)
 result = val.flatten 
    result
end

#_reduce_20(val, _values, result) ⇒ Object

reduce 19 omitted


434
435
436
437
# File 'lib/nokogiri/css/parser.rb', line 434

def _reduce_20(val, _values, result)
 result = Node.new(:ELEMENT_NAME, val) 
    result
end

#_reduce_21(val, _values, result) ⇒ Object


439
440
441
442
443
444
445
# File 'lib/nokogiri/css/parser.rb', line 439

def _reduce_21(val, _values, result)
        result = Node.new(:ELEMENT_NAME,
          [[val.first, val.last].compact.join(':')]
        )
      
    result
end

#_reduce_22(val, _values, result) ⇒ Object


447
448
449
450
451
452
# File 'lib/nokogiri/css/parser.rb', line 447

def _reduce_22(val, _values, result)
        name = @namespaces.key?('xmlns') ? "xmlns:#{val.first}" : val.first
        result = Node.new(:ELEMENT_NAME, [name])
      
    result
end

#_reduce_23(val, _values, result) ⇒ Object


454
455
456
457
# File 'lib/nokogiri/css/parser.rb', line 454

def _reduce_23(val, _values, result)
 result = val[0] 
    result
end

#_reduce_25(val, _values, result) ⇒ Object

reduce 24 omitted


461
462
463
464
465
466
467
# File 'lib/nokogiri/css/parser.rb', line 461

def _reduce_25(val, _values, result)
        result = Node.new(:ATTRIBUTE_CONDITION,
          [val[1]] + (val[2] || [])
        )
      
    result
end

#_reduce_26(val, _values, result) ⇒ Object


469
470
471
472
473
474
475
# File 'lib/nokogiri/css/parser.rb', line 469

def _reduce_26(val, _values, result)
        result = Node.new(:ATTRIBUTE_CONDITION,
          [val[1]] + (val[2] || [])
        )
      
    result
end

#_reduce_27(val, _values, result) ⇒ Object


477
478
479
480
481
482
483
484
# File 'lib/nokogiri/css/parser.rb', line 477

def _reduce_27(val, _values, result)
        # Non standard, but hpricot supports it.
        result = Node.new(:PSEUDO_CLASS,
          [Node.new(:FUNCTION, ['nth-child(', val[1]])]
        )
      
    result
end

#_reduce_28(val, _values, result) ⇒ Object


486
487
488
489
490
491
492
# File 'lib/nokogiri/css/parser.rb', line 486

def _reduce_28(val, _values, result)
        result = Node.new(:ELEMENT_NAME,
          [[val.first, val.last].compact.join(':')]
        )
      
    result
end

#_reduce_29(val, _values, result) ⇒ Object


494
495
496
497
498
499
500
# File 'lib/nokogiri/css/parser.rb', line 494

def _reduce_29(val, _values, result)
        # Default namespace is not applied to attributes.
        # So we don't add prefix "xmlns:" as in namespaced_ident.
        result = Node.new(:ELEMENT_NAME, [val.first])
      
    result
end

#_reduce_3(val, _values, result) ⇒ Object


345
346
347
348
# File 'lib/nokogiri/css/parser.rb', line 345

def _reduce_3(val, _values, result)
 result = [val.last].flatten 
    result
end

#_reduce_30(val, _values, result) ⇒ Object


502
503
504
505
506
# File 'lib/nokogiri/css/parser.rb', line 502

def _reduce_30(val, _values, result)
        result = Node.new(:FUNCTION, [val.first.strip])
      
    result
end

#_reduce_31(val, _values, result) ⇒ Object


508
509
510
511
512
# File 'lib/nokogiri/css/parser.rb', line 508

def _reduce_31(val, _values, result)
        result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)
      
    result
end

#_reduce_32(val, _values, result) ⇒ Object


514
515
516
517
518
# File 'lib/nokogiri/css/parser.rb', line 514

def _reduce_32(val, _values, result)
        result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)
      
    result
end

#_reduce_33(val, _values, result) ⇒ Object


520
521
522
523
524
# File 'lib/nokogiri/css/parser.rb', line 520

def _reduce_33(val, _values, result)
        result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)
      
    result
end

#_reduce_34(val, _values, result) ⇒ Object


526
527
528
529
530
# File 'lib/nokogiri/css/parser.rb', line 526

def _reduce_34(val, _values, result)
        result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)
      
    result
end

#_reduce_35(val, _values, result) ⇒ Object


532
533
534
535
# File 'lib/nokogiri/css/parser.rb', line 532

def _reduce_35(val, _values, result)
 result = [val.first, val.last] 
    result
end

#_reduce_36(val, _values, result) ⇒ Object


537
538
539
540
# File 'lib/nokogiri/css/parser.rb', line 537

def _reduce_36(val, _values, result)
 result = [val.first, val.last] 
    result
end

#_reduce_37(val, _values, result) ⇒ Object


542
543
544
545
# File 'lib/nokogiri/css/parser.rb', line 542

def _reduce_37(val, _values, result)
 result = [val.first, val.last] 
    result
end

#_reduce_4(val, _values, result) ⇒ Object


350
351
352
353
# File 'lib/nokogiri/css/parser.rb', line 350

def _reduce_4(val, _values, result)
 result = :DIRECT_ADJACENT_SELECTOR 
    result
end

#_reduce_40(val, _values, result) ⇒ Object

reduce 39 omitted


551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
# File 'lib/nokogiri/css/parser.rb', line 551

def _reduce_40(val, _values, result)
        case val[0]
        when 'even'
          result = Node.new(:NTH, ['2','n','+','0'])
        when 'odd'
          result = Node.new(:NTH, ['2','n','+','1'])
        when 'n'
          result = Node.new(:NTH, ['1','n','+','0'])
        else
          # This is not CSS standard.  It allows us to support this:
          # assert_xpath("//a[foo(., @href)]", @parser.parse('a:foo(@href)'))
          # assert_xpath("//a[foo(., @a, b)]", @parser.parse('a:foo(@a, b)'))
          # assert_xpath("//a[foo(., a, 10)]", @parser.parse('a:foo(a, 10)'))
          result = val
        end
      
    result
end

#_reduce_41(val, _values, result) ⇒ Object


570
571
572
573
574
575
576
577
578
# File 'lib/nokogiri/css/parser.rb', line 570

def _reduce_41(val, _values, result)
        if val[1] == 'n'
          result = Node.new(:NTH, val)
        else
          raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
        end
      
    result
end

#_reduce_42(val, _values, result) ⇒ Object


580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
# File 'lib/nokogiri/css/parser.rb', line 580

def _reduce_42(val, _values, result)
               # n+3, -n+3
        if val[0] == 'n'
          val.unshift("1")
          result = Node.new(:NTH, val)
        elsif val[0] == '-n'
          val[0] = 'n'
          val.unshift("-1")
          result = Node.new(:NTH, val)
        else
          raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
        end
      
    result
end

#_reduce_43(val, _values, result) ⇒ Object


596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
# File 'lib/nokogiri/css/parser.rb', line 596

def _reduce_43(val, _values, result)
                    # 5n, -5n, 10n-1
        n = val[1]
        if n[0, 2] == 'n-'
          val[1] = 'n'
          val << "-"
          # b is contained in n as n is the string "n-b"
          val << n[2, n.size]
          result = Node.new(:NTH, val)
        elsif n == 'n'
          val << "+"
          val << "0"
          result = Node.new(:NTH, val)
        else
          raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
        end
      
    result
end

#_reduce_44(val, _values, result) ⇒ Object


616
617
618
619
620
# File 'lib/nokogiri/css/parser.rb', line 616

def _reduce_44(val, _values, result)
        result = Node.new(:PSEUDO_CLASS, [val[1]])
      
    result
end

#_reduce_45(val, _values, result) ⇒ Object


622
623
624
625
# File 'lib/nokogiri/css/parser.rb', line 622

def _reduce_45(val, _values, result)
 result = Node.new(:PSEUDO_CLASS, [val[1]]) 
    result
end

#_reduce_48(val, _values, result) ⇒ Object

reduce 47 omitted


631
632
633
634
635
# File 'lib/nokogiri/css/parser.rb', line 631

def _reduce_48(val, _values, result)
        result = Node.new(:COMBINATOR, val)
      
    result
end

#_reduce_49(val, _values, result) ⇒ Object


637
638
639
640
641
# File 'lib/nokogiri/css/parser.rb', line 637

def _reduce_49(val, _values, result)
        result = Node.new(:COMBINATOR, val)
      
    result
end

#_reduce_5(val, _values, result) ⇒ Object


355
356
357
358
# File 'lib/nokogiri/css/parser.rb', line 355

def _reduce_5(val, _values, result)
 result = :CHILD_SELECTOR 
    result
end

#_reduce_50(val, _values, result) ⇒ Object


643
644
645
646
647
# File 'lib/nokogiri/css/parser.rb', line 643

def _reduce_50(val, _values, result)
        result = Node.new(:COMBINATOR, val)
      
    result
end

#_reduce_51(val, _values, result) ⇒ Object


649
650
651
652
653
# File 'lib/nokogiri/css/parser.rb', line 649

def _reduce_51(val, _values, result)
        result = Node.new(:COMBINATOR, val)
      
    result
end

#_reduce_52(val, _values, result) ⇒ Object


655
656
657
658
659
# File 'lib/nokogiri/css/parser.rb', line 655

def _reduce_52(val, _values, result)
        result = Node.new(:COMBINATOR, val)
      
    result
end

#_reduce_58(val, _values, result) ⇒ Object

reduce 57 omitted


671
672
673
674
# File 'lib/nokogiri/css/parser.rb', line 671

def _reduce_58(val, _values, result)
 result = Node.new(:ID, [unescape_css_identifier(val.first)]) 
    result
end

#_reduce_59(val, _values, result) ⇒ Object


676
677
678
679
# File 'lib/nokogiri/css/parser.rb', line 676

def _reduce_59(val, _values, result)
 result = [val.first, unescape_css_identifier(val[1])] 
    result
end

#_reduce_6(val, _values, result) ⇒ Object


360
361
362
363
# File 'lib/nokogiri/css/parser.rb', line 360

def _reduce_6(val, _values, result)
 result = :FOLLOWING_SELECTOR 
    result
end

#_reduce_60(val, _values, result) ⇒ Object


681
682
683
684
# File 'lib/nokogiri/css/parser.rb', line 681

def _reduce_60(val, _values, result)
 result = [val.first, unescape_css_string(val[1])] 
    result
end

#_reduce_61(val, _values, result) ⇒ Object


686
687
688
689
# File 'lib/nokogiri/css/parser.rb', line 686

def _reduce_61(val, _values, result)
 result = [val.first, val[1]] 
    result
end

#_reduce_63(val, _values, result) ⇒ Object

reduce 62 omitted


693
694
695
696
# File 'lib/nokogiri/css/parser.rb', line 693

def _reduce_63(val, _values, result)
 result = :equal 
    result
end

#_reduce_64(val, _values, result) ⇒ Object


698
699
700
701
# File 'lib/nokogiri/css/parser.rb', line 698

def _reduce_64(val, _values, result)
 result = :prefix_match 
    result
end

#_reduce_65(val, _values, result) ⇒ Object


703
704
705
706
# File 'lib/nokogiri/css/parser.rb', line 703

def _reduce_65(val, _values, result)
 result = :suffix_match 
    result
end

#_reduce_66(val, _values, result) ⇒ Object


708
709
710
711
# File 'lib/nokogiri/css/parser.rb', line 708

def _reduce_66(val, _values, result)
 result = :substring_match 
    result
end

#_reduce_67(val, _values, result) ⇒ Object


713
714
715
716
# File 'lib/nokogiri/css/parser.rb', line 713

def _reduce_67(val, _values, result)
 result = :not_equal 
    result
end

#_reduce_68(val, _values, result) ⇒ Object


718
719
720
721
# File 'lib/nokogiri/css/parser.rb', line 718

def _reduce_68(val, _values, result)
 result = :includes 
    result
end

#_reduce_69(val, _values, result) ⇒ Object


723
724
725
726
# File 'lib/nokogiri/css/parser.rb', line 723

def _reduce_69(val, _values, result)
 result = :dash_match 
    result
end

#_reduce_7(val, _values, result) ⇒ Object


365
366
367
368
# File 'lib/nokogiri/css/parser.rb', line 365

def _reduce_7(val, _values, result)
 result = :DESCENDANT_SELECTOR 
    result
end

#_reduce_70(val, _values, result) ⇒ Object


728
729
730
731
732
# File 'lib/nokogiri/css/parser.rb', line 728

def _reduce_70(val, _values, result)
        result = Node.new(:NOT, [val[1]])
      
    result
end

#_reduce_8(val, _values, result) ⇒ Object


370
371
372
373
# File 'lib/nokogiri/css/parser.rb', line 370

def _reduce_8(val, _values, result)
 result = :CHILD_SELECTOR 
    result
end

#_reduce_9(val, _values, result) ⇒ Object


375
376
377
378
379
380
381
382
383
# File 'lib/nokogiri/css/parser.rb', line 375

def _reduce_9(val, _values, result)
        result =  if val[1].nil?
                    val.first
                  else
                    Node.new(:CONDITIONAL_SELECTOR, [val.first, val[1]])
                  end
      
    result
end

#_reduce_none(val, _values, result) ⇒ Object

reduce 75 omitted


744
745
746
# File 'lib/nokogiri/css/parser.rb', line 744

def _reduce_none(val, _values, result)
  val[0]
end

#next_tokenObject


65
66
67
# File 'lib/nokogiri/css/parser_extras.rb', line 65

def next_token
  @tokenizer.next_token
end

#on_error(error_token_id, error_value, value_stack) ⇒ Object

On CSS parser error, raise an exception

Raises:


85
86
87
88
# File 'lib/nokogiri/css/parser_extras.rb', line 85

def on_error error_token_id, error_value, value_stack
  after = value_stack.compact.last
  raise SyntaxError.new("unexpected '#{error_value}' after '#{after}'")
end

#parse(string) ⇒ Object


60
61
62
63
# File 'lib/nokogiri/css/parser_extras.rb', line 60

def parse string
  @tokenizer.scan_setup string
  do_parse
end

#unescape_css_identifier(identifier) ⇒ Object


17
18
19
# File 'lib/nokogiri/css/parser.rb', line 17

def unescape_css_identifier(identifier)
  identifier.gsub(/\\(?:([^0-9a-fA-F])|([0-9a-fA-F]{1,6})\s?)/){ |m| $1 || [$2.hex].pack('U') }
end

#unescape_css_string(str) ⇒ Object


21
22
23
24
25
26
27
28
29
# File 'lib/nokogiri/css/parser.rb', line 21

def unescape_css_string(str)
  str.gsub(/\\(?:([^0-9a-fA-F])|([0-9a-fA-F]{1,6})\s?)/) do |m|
    if $1=="\n"
      ''
    else
      $1 || [$2.hex].pack('U')
    end
  end
end

#xpath_for(string, options = {}) ⇒ Object

Get the xpath for string using options


70
71
72
73
74
75
76
77
78
79
80
81
82
# File 'lib/nokogiri/css/parser_extras.rb', line 70

def xpath_for string, options={}
  key = "#{string}#{options[:ns]}#{options[:prefix]}"
  v = self.class[key]
  return v if v

  args = [
    options[:prefix] || '//',
    options[:visitor] || XPathVisitor.new
  ]
  self.class[key] = parse(string).map { |ast|
    ast.to_xpath(*args)
  }
end