-- Load the LuaRocks loader first (presumably so that rocks-installed modules
-- such as lunitx can be found by require — confirm for your environment).
require("luarocks.loader")
-- Omit next line in actual module clients; it's only to support development of the module itself
package.path = "../src/?.lua;" .. package.path
local lunitx = require("lunitx")
-- Declare this file as the "html" module, passing lunitx.testcase and
-- package.seeall as module options. The test_* functions below are therefore
-- deliberately non-local: they become members of this module.
module("html", lunitx.testcase, package.seeall)
-- The parser under test. Because ../src was prepended to package.path above,
-- a development copy in ../src is searched before any other location.
local htmlparser = require("htmlparser")
--- Void elements: each top-level node must either be the "p" wrapper
-- (holding four child nodes) or a "br" whose content is the empty string.
function test_void()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(5, #root.nodes, "top level")
  for _, node in ipairs(root.nodes) do
    if node.name ~= "p" then
      -- Anything that is not the paragraph has to be an empty "br".
      assert_equal("br", node.name, "name")
      assert_equal("", node:getcontent(), "content")
    else
      assert_equal(4, #node.nodes, "deeper level")
    end
  end
end
--- Id selectors: "#<id>" must yield, as its first match, the element with
-- the expected tag name.
function test_id()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(1, #root.nodes, "top level")
  -- Ordered list so the assertions run in a fixed sequence.
  local cases = {
    { selector = "#4711", name = "n" },
    { selector = "#1174", name = "m" },
  }
  for _, case in ipairs(cases) do
    local first = root(case.selector)[1]
    assert_equal(case.name, first.name, case.selector)
  end
end
--- Class selectors: checks the number of matches for single classes, a
-- combined class selector, and a class that matches nothing.
function test_class()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(3, #root.nodes, "top level")
  -- { selector, expected match count }, checked in this order.
  local cases = {
    { ".one", 1 },
    { ".two", 2 },
    { ".three", 2 },
    { ".two.three", 1 },
    { ".four", 0 },
  }
  for _, case in ipairs(cases) do
    local selector, expected = case[1], case[2]
    assert_equal(expected, #root(selector), selector)
  end
end
--- Attribute-presence selectors: "[aN]" must produce at least one match for
-- every attribute a1 through a10.
function test_attr()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(1, #root.nodes, "top level")
  for index = 1, 10 do
    -- The attribute name doubles as the assertion message.
    local attribute = "a" .. index
    assert(root("[" .. attribute .. "]")[1], attribute)
  end
end
--- Attribute-equality selectors: "[name=value]" must produce at least one
-- match for each listed condition, including empty and quoted values.
function test_attr_equal()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(1, #root.nodes, "top level")
  -- Each condition is wrapped in brackets to form the selector and is also
  -- used verbatim as the assertion message.
  local conditions = {
    "a1=''",
    "a2=''",
    "a3=''",
    "a4=''",
    "a5='a\"5\"'",
    "a6=\"a'6'\"",
    -- not these characters
    -- (because these have a special meaning as id, class, or attribute selector, hierarchy separator, or filter command)
    -- they can occur in the HTML, but not in a selector string
    -- "a7='#.[] :()'"
    "a8='|*+-=?$^%&/'",
    "a9='a9'",
    "a10=''",
    "a10=",
  }
  for _, condition in ipairs(conditions) do
    assert(root("[" .. condition .. "]")[1], condition)
  end
end
--- Attribute-inequality selectors: checks the number of matches of
-- "[a1!=value]" for several values, including the empty value.
function test_attr_notequal()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(4, #root.nodes, "top level")
  -- { condition, expected match count }; the selector is "[condition]".
  local cases = {
    { "a1!='a1'", 3 },
    { "a1!='b1'", 4 },
    { "a1!=''", 3 },
    { "a1!=", 3 },
  }
  for _, case in ipairs(cases) do
    local condition, expected = case[1], case[2]
    assert_equal(expected, #root("[" .. condition .. "]"), condition)
  end
end
--- Attribute operators "|=", "^=" and "$=": checks the number of matches
-- each operator yields for the value 'en'.
function test_attr_prefix_start_end()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(5, #root.nodes, "top level")
  -- { condition, expected match count }; the selector is "[condition]".
  local cases = {
    { "a1|='en'", 3 },
    { "a1^='en'", 4 },
    { "a1$='en'", 2 },
  }
  for _, case in ipairs(cases) do
    local condition, expected = case[1], case[2]
    assert_equal(expected, #root("[" .. condition .. "]"), condition)
  end
end
--- Attribute operator "~=": checks the number of matches for three
-- different words.
function test_attr_word()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(4, #root.nodes, "top level")
  -- { condition, expected match count }; the selector is "[condition]".
  local cases = {
    { "a1~='two'", 1 },
    { "a1~='three'", 2 },
    { "a1~='four'", 1 },
  }
  for _, case in ipairs(cases) do
    local condition, expected = case[1], case[2]
    assert_equal(expected, #root("[" .. condition .. "]"), condition)
  end
end
--- Attribute operator "*=": checks the number of matches for several
-- substrings, including the empty one in both quoted and bare form.
function test_attr_contains()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(6, #root.nodes, "top level")
  -- { condition, expected match count }; the selector is "[condition]".
  local cases = {
    { "a1*='one'", 2 },
    { "a1*='t'", 2 },
    { "a1*='f'", 1 },
    { "a1*=''", 5 },
    { "a1*=", 5 },
  }
  for _, case in ipairs(cases) do
    local condition, expected = case[1], case[2]
    assert_equal(expected, #root("[" .. condition .. "]"), condition)
  end
end
--- Descendant combinator: "parent child" must yield exactly eight matches.
function test_descendants()
  -- NOTE(review): this fixture literal holds only text lines and no markup
  -- in the text under review — confirm the fixture.
  local markup = [[
1
1
2
3
4
2
5
6
7
8
not
]]
  local root = htmlparser.parse(markup)
  local selector = "parent child"
  local matches = root(selector)
  assert_equal(8, #matches, selector)
end
--- Child combinator: "parent > child" must yield exactly four matches.
function test_children()
  -- NOTE(review): this fixture literal holds only text lines and no markup
  -- in the text under review — confirm the fixture.
  local markup = [[
1
1
2
not
not
2
3
4
not
not
not
]]
  local root = htmlparser.parse(markup)
  local selector = "parent > child"
  local matches = root(selector)
  assert_equal(4, #matches, selector)
end
--- Negation filter: checks the number of matches of ":not(...)" wrapped
-- around attribute and element-name selectors.
function test_not()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(2, #root.nodes, "top level")
  -- { selector, expected match count }, checked in this order.
  local cases = {
    { ":not([a1=1])", 1 },
    { ":not([a2])", 1 },
    { ":not(n)", 1 },
    { ":not(m)", 2 },
  }
  for _, case in ipairs(cases) do
    local selector, expected = case[1], case[2]
    assert_equal(expected, #root(selector), selector)
  end
end
--- Combined selectors: checks match counts when element, class, id,
-- attribute, ":not" and hierarchy parts are mixed in one selector string.
function test_combine()
  -- NOTE(review): this fixture literal holds no markup in the text under
  -- review, although the assertions below expect nodes — confirm the fixture.
  local markup = [[
]]
  local root = htmlparser.parse(markup)
  assert_equal(2, #root.nodes, "top level")
  -- { selector, expected match count }, checked in this order.
  local cases = {
    { "e.c:not([a|='1']) > n[b*='2']", 2 },
    { "e.c:not([a|='1']) n[b*='2']", 3 },
    { "#123 .c[b]", 1 },
  }
  for _, case in ipairs(cases) do
    local selector, expected = case[1], case[2]
    assert_equal(expected, #root(selector), selector)
  end
end
--- Result ordering: the i-th match for "n" must have content i, and the
-- i-th match for ":not(n)" must have the name i.
--
-- Both result lists are walked with a numeric loop over 1..#list rather than
-- pairs(): pairs() gives no ordering guarantee and also visits non-sequence
-- keys, whereas this test is specifically about positions in the sequence.
-- Walking the indices in ascending order also makes the first reported
-- failure deterministic.
function test_order()
  -- NOTE(review): this fixture literal looks truncated in the text under
  -- review (e.g. bare "4>" lines) — confirm the fixture.
  local tree = htmlparser.parse([[
<1>
1
<2>
2
3
<3>
4
5
6
<4>
7
8
9
10
4>
3>
2>
1>
]])
  assert_equal(1, #tree.nodes, "top level")

  local n = tree("n")
  assert_equal(10, #n, "n")
  for i = 1, #n do
    assert_equal(i, tonumber(n[i]:getcontent()), "n order")
  end

  local notn = tree(":not(n)")
  assert_equal(4, #notn, "notn")
  for i = 1, #notn do
    assert_equal(i, tonumber(notn[i].name), "notn order")
  end
end