Class: Nokogiri::CSS::Parser

Inherits:
Racc::Parser
  • Object
show all
Defined in:
lib/nokogiri/css/parser.rb,
lib/nokogiri/css/parser_extras.rb

Constant Summary collapse

Racc_arg =
[
  racc_action_table,
  racc_action_check,
  racc_action_default,
  racc_action_pointer,
  racc_goto_table,
  racc_goto_check,
  racc_goto_default,
  racc_goto_pointer,
  racc_nt_base,
  racc_reduce_table,
  racc_token_table,
  racc_shift_n,
  racc_reduce_n,
  racc_use_result_var,
]
Racc_token_to_s_table =
[
  "$end",
  "error",
  "FUNCTION",
  "INCLUDES",
  "DASHMATCH",
  "LBRACE",
  "HASH",
  "PLUS",
  "GREATER",
  "S",
  "STRING",
  "IDENT",
  "COMMA",
  "NUMBER",
  "PREFIXMATCH",
  "SUFFIXMATCH",
  "SUBSTRINGMATCH",
  "TILDE",
  "NOT_EQUAL",
  "SLASH",
  "DOUBLESLASH",
  "NOT",
  "EQUAL",
  "RPAREN",
  "LSQUARE",
  "RSQUARE",
  "HAS",
  "\".\"",
  "\"*\"",
  "\"|\"",
  "\":\"",
  "$start",
  "selector",
  "simple_selector_1toN",
  "prefixless_combinator_selector",
  "optional_S",
  "combinator",
  "simple_selector",
  "element_name",
  "hcap_0toN",
  "function",
  "pseudo",
  "attrib",
  "hcap_1toN",
  "class",
  "namespaced_ident",
  "namespace",
  "attrib_name",
  "attrib_val_0or1",
  "expr",
  "nth",
  "attribute_id",
  "negation",
  "eql_incl_dash",
  "negation_arg",
]
Racc_debug_parser =
false

Class Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(namespaces = {}) ⇒ Parser

Create a new CSS parser with respect to namespaces



54
55
56
57
58
# File 'lib/nokogiri/css/parser_extras.rb', line 54

def initialize namespaces = {}
  @tokenizer  = Tokenizer.new
  @namespaces = namespaces
  super()
end

Class Attribute Details

.cache_onObject Also known as: cache_on?

Turn on CSS parse caching



12
13
14
# File 'lib/nokogiri/css/parser_extras.rb', line 12

def cache_on
  @cache_on
end

Class Method Details

.[](string) ⇒ Object

Get the css selector in string from the cache



17
18
19
20
# File 'lib/nokogiri/css/parser_extras.rb', line 17

def [] string
  return unless @cache_on
  @mutex.synchronize { @cache[string] }
end

.[]=(string, value) ⇒ Object

Set the css selector in string in the cache to value



23
24
25
26
# File 'lib/nokogiri/css/parser_extras.rb', line 23

def []= string, value
  return value unless @cache_on
  @mutex.synchronize { @cache[string] = value }
end

.clear_cacheObject

Clear the cache



29
30
31
# File 'lib/nokogiri/css/parser_extras.rb', line 29

def clear_cache
  @mutex.synchronize { @cache = {} }
end

.parse(selector) ⇒ Object

Parse this CSS selector in selector. Returns an AST.



43
44
45
46
47
48
49
50
# File 'lib/nokogiri/css/parser_extras.rb', line 43

def parse selector
  @warned ||= false
  unless @warned
    $stderr.puts('Nokogiri::CSS::Parser.parse is deprecated, call Nokogiri::CSS.parse(), this will be removed August 1st or version 1.4.0 (whichever is first)')
    @warned = true
  end
  new.parse selector
end

.without_cache(&block) ⇒ Object

Execute block without cache



34
35
36
37
38
39
# File 'lib/nokogiri/css/parser_extras.rb', line 34

def without_cache &block
  tmp = @cache_on
  @cache_on = false
  block.call
  @cache_on = tmp
end

Instance Method Details

#_reduce_1(val, _values, result) ⇒ Object

reduce 0 omitted



352
353
354
355
356
# File 'lib/nokogiri/css/parser.rb', line 352

def _reduce_1(val, _values, result)
  result = [val.first, val.last].flatten

  result
end

#_reduce_11(val, _values, result) ⇒ Object

reduce 10 omitted



405
406
407
408
409
# File 'lib/nokogiri/css/parser.rb', line 405

def _reduce_11(val, _values, result)
  result = Node.new(:CONDITIONAL_SELECTOR, val)

  result
end

#_reduce_12(val, _values, result) ⇒ Object



411
412
413
414
415
# File 'lib/nokogiri/css/parser.rb', line 411

def _reduce_12(val, _values, result)
  result = Node.new(:CONDITIONAL_SELECTOR, val)

  result
end

#_reduce_13(val, _values, result) ⇒ Object



417
418
419
420
421
422
# File 'lib/nokogiri/css/parser.rb', line 417

def _reduce_13(val, _values, result)
  result = Node.new(:CONDITIONAL_SELECTOR,
                    [Node.new(:ELEMENT_NAME, ["*"]), val.first])

  result
end

#_reduce_14(val, _values, result) ⇒ Object



424
425
426
427
428
# File 'lib/nokogiri/css/parser.rb', line 424

def _reduce_14(val, _values, result)
  result = Node.new(val.first, [nil, val.last])

  result
end

#_reduce_15(val, _values, result) ⇒ Object



430
431
432
433
434
# File 'lib/nokogiri/css/parser.rb', line 430

def _reduce_15(val, _values, result)
  result = Node.new(val[1], [val.first, val.last])

  result
end

#_reduce_16(val, _values, result) ⇒ Object



436
437
438
439
440
# File 'lib/nokogiri/css/parser.rb', line 436

def _reduce_16(val, _values, result)
  result = Node.new(:DESCENDANT_SELECTOR, [val.first, val.last])

  result
end

#_reduce_18(val, _values, result) ⇒ Object

reduce 17 omitted



444
445
446
447
# File 'lib/nokogiri/css/parser.rb', line 444

def _reduce_18(val, _values, result)
  result = Node.new(:CLASS_CONDITION, [unescape_css_identifier(val[1])])
  result
end

#_reduce_2(val, _values, result) ⇒ Object



358
359
360
361
# File 'lib/nokogiri/css/parser.rb', line 358

def _reduce_2(val, _values, result)
  result = val.flatten
  result
end

#_reduce_20(val, _values, result) ⇒ Object

reduce 19 omitted



451
452
453
454
# File 'lib/nokogiri/css/parser.rb', line 451

def _reduce_20(val, _values, result)
  result = Node.new(:ELEMENT_NAME, val)
  result
end

#_reduce_21(val, _values, result) ⇒ Object



456
457
458
459
460
461
# File 'lib/nokogiri/css/parser.rb', line 456

def _reduce_21(val, _values, result)
  result = Node.new(:ELEMENT_NAME,
                    [[val.first, val.last].compact.join(":")])

  result
end

#_reduce_22(val, _values, result) ⇒ Object



463
464
465
466
467
468
# File 'lib/nokogiri/css/parser.rb', line 463

def _reduce_22(val, _values, result)
  name = @namespaces.key?("xmlns") ? "xmlns:#{val.first}" : val.first
  result = Node.new(:ELEMENT_NAME, [name])

  result
end

#_reduce_23(val, _values, result) ⇒ Object



470
471
472
473
# File 'lib/nokogiri/css/parser.rb', line 470

def _reduce_23(val, _values, result)
  result = val[0]
  result
end

#_reduce_25(val, _values, result) ⇒ Object

reduce 24 omitted



477
478
479
480
481
482
# File 'lib/nokogiri/css/parser.rb', line 477

def _reduce_25(val, _values, result)
  result = Node.new(:ATTRIBUTE_CONDITION,
                    [val[1]] + (val[2] || []))

  result
end

#_reduce_26(val, _values, result) ⇒ Object



484
485
486
487
488
489
# File 'lib/nokogiri/css/parser.rb', line 484

def _reduce_26(val, _values, result)
  result = Node.new(:ATTRIBUTE_CONDITION,
                    [val[1]] + (val[2] || []))

  result
end

#_reduce_27(val, _values, result) ⇒ Object



491
492
493
494
495
496
497
# File 'lib/nokogiri/css/parser.rb', line 491

def _reduce_27(val, _values, result)
  # Non standard, but hpricot supports it.
  result = Node.new(:PSEUDO_CLASS,
                    [Node.new(:FUNCTION, ["nth-child(", val[1]])])

  result
end

#_reduce_28(val, _values, result) ⇒ Object



499
500
501
502
503
504
# File 'lib/nokogiri/css/parser.rb', line 499

def _reduce_28(val, _values, result)
  result = Node.new(:ELEMENT_NAME,
                    [[val.first, val.last].compact.join(":")])

  result
end

#_reduce_29(val, _values, result) ⇒ Object



506
507
508
509
510
511
512
# File 'lib/nokogiri/css/parser.rb', line 506

def _reduce_29(val, _values, result)
  # Default namespace is not applied to attributes.
  # So we don't add prefix "xmlns:" as in namespaced_ident.
  result = Node.new(:ELEMENT_NAME, [val.first])

  result
end

#_reduce_3(val, _values, result) ⇒ Object



363
364
365
366
# File 'lib/nokogiri/css/parser.rb', line 363

def _reduce_3(val, _values, result)
  result = [val.last].flatten
  result
end

#_reduce_30(val, _values, result) ⇒ Object



514
515
516
517
518
# File 'lib/nokogiri/css/parser.rb', line 514

def _reduce_30(val, _values, result)
  result = Node.new(:FUNCTION, [val.first.strip])

  result
end

#_reduce_31(val, _values, result) ⇒ Object



520
521
522
523
524
# File 'lib/nokogiri/css/parser.rb', line 520

def _reduce_31(val, _values, result)
  result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)

  result
end

#_reduce_32(val, _values, result) ⇒ Object



526
527
528
529
530
# File 'lib/nokogiri/css/parser.rb', line 526

def _reduce_32(val, _values, result)
  result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)

  result
end

#_reduce_33(val, _values, result) ⇒ Object



532
533
534
535
536
# File 'lib/nokogiri/css/parser.rb', line 532

def _reduce_33(val, _values, result)
  result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)

  result
end

#_reduce_34(val, _values, result) ⇒ Object



538
539
540
541
542
# File 'lib/nokogiri/css/parser.rb', line 538

def _reduce_34(val, _values, result)
  result = Node.new(:FUNCTION, [val.first.strip, val[1]].flatten)

  result
end

#_reduce_35(val, _values, result) ⇒ Object



544
545
546
547
# File 'lib/nokogiri/css/parser.rb', line 544

def _reduce_35(val, _values, result)
  result = [val.first, val.last]
  result
end

#_reduce_36(val, _values, result) ⇒ Object



549
550
551
552
# File 'lib/nokogiri/css/parser.rb', line 549

def _reduce_36(val, _values, result)
  result = [val.first, val.last]
  result
end

#_reduce_37(val, _values, result) ⇒ Object



554
555
556
557
# File 'lib/nokogiri/css/parser.rb', line 554

def _reduce_37(val, _values, result)
  result = [val.first, val.last]
  result
end

#_reduce_4(val, _values, result) ⇒ Object



368
369
370
371
# File 'lib/nokogiri/css/parser.rb', line 368

def _reduce_4(val, _values, result)
  result = :DIRECT_ADJACENT_SELECTOR
  result
end

#_reduce_40(val, _values, result) ⇒ Object

reduce 39 omitted



563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
# File 'lib/nokogiri/css/parser.rb', line 563

def _reduce_40(val, _values, result)
  case val[0]
  when "even"
    result = Node.new(:NTH, ["2", "n", "+", "0"])
  when "odd"
    result = Node.new(:NTH, ["2", "n", "+", "1"])
  when "n"
    result = Node.new(:NTH, ["1", "n", "+", "0"])
  else
    # This is not CSS standard.  It allows us to support this:
    # assert_xpath("//a[foo(., @href)]", @parser.parse('a:foo(@href)'))
    # assert_xpath("//a[foo(., @a, b)]", @parser.parse('a:foo(@a, b)'))
    # assert_xpath("//a[foo(., a, 10)]", @parser.parse('a:foo(a, 10)'))
    result = val
  end

  result
end

#_reduce_41(val, _values, result) ⇒ Object



582
583
584
585
586
587
588
589
590
# File 'lib/nokogiri/css/parser.rb', line 582

def _reduce_41(val, _values, result)
  if val[1] == "n"
    result = Node.new(:NTH, val)
  else
    raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
  end

  result
end

#_reduce_42(val, _values, result) ⇒ Object



592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
# File 'lib/nokogiri/css/parser.rb', line 592

def _reduce_42(val, _values, result)
  # n+3, -n+3
  if val[0] == "n"
    val.unshift("1")
    result = Node.new(:NTH, val)
  elsif val[0] == "-n"
    val[0] = "n"
    val.unshift("-1")
    result = Node.new(:NTH, val)
  else
    raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
  end

  result
end

#_reduce_43(val, _values, result) ⇒ Object



608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
# File 'lib/nokogiri/css/parser.rb', line 608

def _reduce_43(val, _values, result)
  # 5n, -5n, 10n-1
  n = val[1]
  if n[0, 2] == "n-"
    val[1] = "n"
    val << "-"
    # b is contained in n as n is the string "n-b"
    val << n[2, n.size]
    result = Node.new(:NTH, val)
  elsif n == "n"
    val << "+"
    val << "0"
    result = Node.new(:NTH, val)
  else
    raise Racc::ParseError, "parse error on IDENT '#{val[1]}'"
  end

  result
end

#_reduce_44(val, _values, result) ⇒ Object



628
629
630
631
632
# File 'lib/nokogiri/css/parser.rb', line 628

def _reduce_44(val, _values, result)
  result = Node.new(:PSEUDO_CLASS, [val[1]])

  result
end

#_reduce_45(val, _values, result) ⇒ Object



634
635
636
637
# File 'lib/nokogiri/css/parser.rb', line 634

def _reduce_45(val, _values, result)
  result = Node.new(:PSEUDO_CLASS, [val[1]])
  result
end

#_reduce_48(val, _values, result) ⇒ Object

reduce 47 omitted



643
644
645
646
647
# File 'lib/nokogiri/css/parser.rb', line 643

def _reduce_48(val, _values, result)
  result = Node.new(:COMBINATOR, val)

  result
end

#_reduce_49(val, _values, result) ⇒ Object



649
650
651
652
653
# File 'lib/nokogiri/css/parser.rb', line 649

def _reduce_49(val, _values, result)
  result = Node.new(:COMBINATOR, val)

  result
end

#_reduce_5(val, _values, result) ⇒ Object



373
374
375
376
# File 'lib/nokogiri/css/parser.rb', line 373

def _reduce_5(val, _values, result)
  result = :CHILD_SELECTOR
  result
end

#_reduce_50(val, _values, result) ⇒ Object



655
656
657
658
659
# File 'lib/nokogiri/css/parser.rb', line 655

def _reduce_50(val, _values, result)
  result = Node.new(:COMBINATOR, val)

  result
end

#_reduce_51(val, _values, result) ⇒ Object



661
662
663
664
665
# File 'lib/nokogiri/css/parser.rb', line 661

def _reduce_51(val, _values, result)
  result = Node.new(:COMBINATOR, val)

  result
end

#_reduce_52(val, _values, result) ⇒ Object



667
668
669
670
671
# File 'lib/nokogiri/css/parser.rb', line 667

def _reduce_52(val, _values, result)
  result = Node.new(:COMBINATOR, val)

  result
end

#_reduce_58(val, _values, result) ⇒ Object

reduce 57 omitted



683
684
685
686
# File 'lib/nokogiri/css/parser.rb', line 683

def _reduce_58(val, _values, result)
  result = Node.new(:ID, [unescape_css_identifier(val.first)])
  result
end

#_reduce_59(val, _values, result) ⇒ Object



688
689
690
691
# File 'lib/nokogiri/css/parser.rb', line 688

def _reduce_59(val, _values, result)
  result = [val.first, unescape_css_identifier(val[1])]
  result
end

#_reduce_6(val, _values, result) ⇒ Object



378
379
380
381
# File 'lib/nokogiri/css/parser.rb', line 378

def _reduce_6(val, _values, result)
  result = :FOLLOWING_SELECTOR
  result
end

#_reduce_60(val, _values, result) ⇒ Object



693
694
695
696
# File 'lib/nokogiri/css/parser.rb', line 693

def _reduce_60(val, _values, result)
  result = [val.first, unescape_css_string(val[1])]
  result
end

#_reduce_61(val, _values, result) ⇒ Object



698
699
700
701
# File 'lib/nokogiri/css/parser.rb', line 698

def _reduce_61(val, _values, result)
  result = [val.first, val[1]]
  result
end

#_reduce_63(val, _values, result) ⇒ Object

reduce 62 omitted



705
706
707
708
# File 'lib/nokogiri/css/parser.rb', line 705

def _reduce_63(val, _values, result)
  result = :equal
  result
end

#_reduce_64(val, _values, result) ⇒ Object



710
711
712
713
# File 'lib/nokogiri/css/parser.rb', line 710

def _reduce_64(val, _values, result)
  result = :prefix_match
  result
end

#_reduce_65(val, _values, result) ⇒ Object



715
716
717
718
# File 'lib/nokogiri/css/parser.rb', line 715

def _reduce_65(val, _values, result)
  result = :suffix_match
  result
end

#_reduce_66(val, _values, result) ⇒ Object



720
721
722
723
# File 'lib/nokogiri/css/parser.rb', line 720

def _reduce_66(val, _values, result)
  result = :substring_match
  result
end

#_reduce_67(val, _values, result) ⇒ Object



725
726
727
728
# File 'lib/nokogiri/css/parser.rb', line 725

def _reduce_67(val, _values, result)
  result = :not_equal
  result
end

#_reduce_68(val, _values, result) ⇒ Object



730
731
732
733
# File 'lib/nokogiri/css/parser.rb', line 730

def _reduce_68(val, _values, result)
  result = :includes
  result
end

#_reduce_69(val, _values, result) ⇒ Object



735
736
737
738
# File 'lib/nokogiri/css/parser.rb', line 735

def _reduce_69(val, _values, result)
  result = :dash_match
  result
end

#_reduce_7(val, _values, result) ⇒ Object



383
384
385
386
# File 'lib/nokogiri/css/parser.rb', line 383

def _reduce_7(val, _values, result)
  result = :DESCENDANT_SELECTOR
  result
end

#_reduce_70(val, _values, result) ⇒ Object



740
741
742
743
744
# File 'lib/nokogiri/css/parser.rb', line 740

def _reduce_70(val, _values, result)
  result = Node.new(:NOT, [val[1]])

  result
end

#_reduce_8(val, _values, result) ⇒ Object



388
389
390
391
# File 'lib/nokogiri/css/parser.rb', line 388

def _reduce_8(val, _values, result)
  result = :CHILD_SELECTOR
  result
end

#_reduce_9(val, _values, result) ⇒ Object



393
394
395
396
397
398
399
400
401
# File 'lib/nokogiri/css/parser.rb', line 393

def _reduce_9(val, _values, result)
  result = if val[1].nil?
             val.first
           else
             Node.new(:CONDITIONAL_SELECTOR, [val.first, val[1]])
           end

  result
end

#_reduce_none(val, _values, result) ⇒ Object

reduce 75 omitted



756
757
758
# File 'lib/nokogiri/css/parser.rb', line 756

def _reduce_none(val, _values, result)
  val[0]
end

#next_tokenObject



65
66
67
# File 'lib/nokogiri/css/parser_extras.rb', line 65

def next_token
  @tokenizer.next_token
end

#on_error(error_token_id, error_value, value_stack) ⇒ Object

On CSS parser error, raise an exception

Raises:



85
86
87
88
# File 'lib/nokogiri/css/parser_extras.rb', line 85

def on_error error_token_id, error_value, value_stack
  after = value_stack.compact.last
  raise SyntaxError.new("unexpected '#{error_value}' after '#{after}'")
end

#parse(string) ⇒ Object



60
61
62
63
# File 'lib/nokogiri/css/parser_extras.rb', line 60

def parse string
  @tokenizer.scan_setup string
  do_parse
end

#unescape_css_identifier(identifier) ⇒ Object



22
23
24
# File 'lib/nokogiri/css/parser.rb', line 22

def unescape_css_identifier(identifier)
  identifier.gsub(/\\(?:([^0-9a-fA-F])|([0-9a-fA-F]{1,6})\s?)/) { |m| $1 || [$2.hex].pack("U") }
end

#unescape_css_string(str) ⇒ Object



26
27
28
29
30
31
32
33
34
# File 'lib/nokogiri/css/parser.rb', line 26

def unescape_css_string(str)
  str.gsub(/\\(?:([^0-9a-fA-F])|([0-9a-fA-F]{1,6})\s?)/) do |m|
    if $1 == "\n"
      ""
    else
      $1 || [$2.hex].pack("U")
    end
  end
end

#xpath_for(string, options = {}) ⇒ Object

Get the xpath for string using options



70
71
72
73
74
75
76
77
78
79
80
81
82
# File 'lib/nokogiri/css/parser_extras.rb', line 70

def xpath_for string, options={}
  key = "#{string}#{options[:ns]}#{options[:prefix]}"
  v = self.class[key]
  return v if v

  args = [
    options[:prefix] || '//',
    options[:visitor] || XPathVisitor.new
  ]
  self.class[key] = parse(string).map { |ast|
    ast.to_xpath(*args)
  }
end