🏡 index : github.com/captn3m0/cosmere-books.git

require "./spec_helper"

describe Lexbor::Node do
  it "select_tags" do
    parser = Lexbor::Parser.new("<html><body><div class=AAA style='color:red'>Haha</div>
      <div>blah</div>
      </body></html>")

    parser.nodes(Lexbor::Lib::TagIdT::LXB_TAG_DIV).size.should eq 2
    parser.nodes(:div).size.should eq 2
    parser.nodes("div").size.should eq 2
    nodes = parser.nodes(Lexbor::Lib::TagIdT::LXB_TAG_DIV).to_a
    nodes.size.should eq 2

    node1, node2 = nodes
    node1.child!.tag_text.should eq "Haha"
    node2.child!.tag_text.should eq "blah"

    nodes = parser.nodes(:div).to_a
    nodes.size.should eq 2
  end

  it "each_tag" do
    parser = Lexbor::Parser.new("<html><body><div class=AAA style='color:red'>Haha</div>
      <div>blah</div>
      </body></html>")

    nodes = [] of Lexbor::Node
    parser.nodes(Lexbor::Lib::TagIdT::LXB_TAG_DIV).each { |n| nodes << n }
    nodes.size.should eq 2

    node1, node2 = nodes
    node1.child!.tag_text.should eq "Haha"
    node2.child!.tag_text.should eq "blah"

    nodes = [] of Lexbor::Node
    parser.nodes(:div).each { |n| nodes << n }
    nodes.size.should eq 2
  end

  it "correctly works with unicode" do
    str = <<-HTML
      <html>
      <head>
        <meta name="keywords" content="аа, ааааааааааа, ааааааааа, ааа, ааааааа, ааааааааа"  />
      </head>

      <body id='normal' >
        <a href="http://aaaa-aaa.ru/">#</a>
      </body></html>
    HTML

    parser = Lexbor::Parser.new(str)
    parser.nodes(Lexbor::Lib::TagIdT::LXB_TAG_A).size.should eq 1
    parser.nodes(:a).size.should eq 1
    parser.nodes("a").size.should eq 1
  end

  it "parse html with bom" do
    slice = Slice.new(3, 0_u8)
    slice[0] = 0xef.to_u8
    slice[1] = 0xbb.to_u8
    slice[2] = 0xbf.to_u8
    str = String.new(slice)
    str += "<html><head><title>1</title></head></html>"

    if bom = Lexbor::Utils::DetectEncoding.detect_bom(str.to_slice)
      str = String.new(bom.shifted(str.to_slice))
    end

    parser = Lexbor::Parser.new(str)

    title = parser.head!.child!
    title.tag_name.should eq "title"
    title.child.try(&.tag_text).should eq "1"
  end

  it "manually call free, to save memory" do
    10000.times do
      parser = Lexbor::Parser.new("<html><body><div class=AAA style='color:red'>Haha</div>
        <div>blah</div>
        </body></html>")
      parser.free
    end
  end

  it "raise when non supported tag name is given by String" do
    parser = Lexbor::Parser.new("<html></html>")
    expect_raises(Lexbor::Error, /Unknown tag "xxx"/) { parser.nodes("xxx") }
  end

  it "not sigfaulting on more than 1024 elements" do
    str = "<html>" + "<div class=A>ooo</div>" * 2000 + "</html>"
    parser = Lexbor::Parser.new(str)

    c = 0
    parser.nodes(:div).each do |node|
      c += 1 if node.attribute_by("class") == "A"
    end
    c.should eq 2000
  end

  it "parse_stream" do
    str = "<html><body>" + "<div class=A>ooo</div>" * 2000 + "</body></html>"
    io = IO::Memory.new(str)

    parser = Lexbor::Parser.new(io)
    c = 0
    parser.nodes(:div).each do |node|
      c += 1 if node.attribute_by("class") == "A"
    end
    c.should eq 2000
  end

  it "to_html" do
    origin = <<-HTML
      <!doctype html>
      <html lang=en>
        <head>
         <title></title>
        </head>
        <body> </body>
      </html>
    HTML
    parser = Lexbor::Parser.new(origin)
    parser.to_html.should eq "<!DOCTYPE html><html lang=\"en\"><head>\n     <title></title>\n    </head>\n    <body> \n  </body></html>"
  end

  describe "#create_node" do
    it "returns a new Lexbor::Node" do
      tree = Lexbor::Parser.new ""

      node = tree.create_node(:a)

      node.should be_a(Lexbor::Node)
      node.tag_id.should eq(Lexbor::Lib::TagIdT::LXB_TAG_A)
    end

    it "create node with attributes and text" do
      tree = Lexbor::Parser.new ""
      node = tree.create_node(:a)
      node.attribute_add("id", "bla")
      node.attribute_add("class", "red")
      node.to_html.should eq "<a id=\"bla\" class=\"red\"></a>"

      node.inner_text = "some text"

      node.to_html.should eq "<a id=\"bla\" class=\"red\">some text</a>"
    end
  end

  it "nodes iterator works with doctype" do
    parser = Lexbor::Parser.new("<!doctype html><html><body><div class=AAA style='color:red'>Haha</div>
      <div>blah</div>
      </body></html>")

    parser.nodes(Lexbor::Lib::TagIdT::LXB_TAG_DIV).size.should eq 2
    parser.nodes(:div).size.should eq 2
    parser.nodes("div").size.should eq 2
  end

  describe "root element" do
    it do
      m = Lexbor::Parser.new(%q{<!DOCTYPE html><html></html>})
      m.root!.tag_sym.should eq :html
    end
  end
end