module Test_xml =
let knode (r:regexp) = [ key r ]
(************************************************************************
* Utilities lens
*************************************************************************)
(*
let _ = print_regexp(lens_ctype(Xml.text))
let _ = print_endline ""
*)
test Xml.comment get "" =
{ "#comment" = " declarations for
& " }
test Xml.comment get "" = *
test Xml.prolog get "" =
{ "#declaration"
{ "#attribute"
{ "version" = "1.0" }
{ "encoding" = "UTF-8" }
}
}
test Xml.decl_def_item get "" =
{ "!ELEMENT" = "greeting"
{ "#decl" = "(#PCDATA)" }
}
test Xml.decl_def_item get "" =
{ "!ENTITY" = "da"
{ "#decl" = "
" }
}
test Xml.doctype get "" =
{ "!DOCTYPE" = "greeting"
{ "SYSTEM" = "hello.dtd" }
}
test Xml.doctype get "
]>" =
{ "!DOCTYPE" = "foo"
{ "!ELEMENT" = "bar"
{ "#decl" = "(#PCDATA)" }
}
{ "!ELEMENT" = "baz"
{ "#decl" = "(bar)*" }
}
}
let att_def1 = ""
let att_def2 = ""
let att_def3 = ""
test Xml.att_list_def get att_def1 =
{ "!ATTLIST" = "termdef"
{ "1"
{ "#name" = "id" }
{ "#type" = "ID" }
{ "#REQUIRED" }
}
{ "2"
{ "#name" = "name" }
{ "#type" = "CDATA" }
{ "#IMPLIED" }
}
}
test Xml.att_list_def get att_def2 =
{ "!ATTLIST" = "list"
{ "1"
{ "#name" = "type" }
{ "#type" = "(bullets|ordered|glossary)" }
{ "#FIXED" = "ordered" }
}
}
test Xml.att_list_def get att_def3 =
{ "!ATTLIST" = "form"
{ "1"
{ "#name" = "method" }
{ "#type" = "CDATA" }
{ "#FIXED" = "POST" }
}
}
test Xml.notation_def get "" =
{ "!NOTATION" = "not3"
{ "SYSTEM" = "" }
}
let cdata1 = ""
test Xml.cdata get cdata1 = { "#CDATA" = "testing" }
let attr1 = " attr1=\"value1\" attr2=\"value2\""
let attr2 = " attr2=\"foo\""
test Xml.attributes get attr1 =
{ "#attribute"
{ "attr1" = "value1" }
{ "attr2" = "value2" }
}
test Xml.attributes get " refs=\"A1\nA2 A3\"" =
{ "#attribute"
{ "refs" = "A1\nA2 A3" }
}
test Xml.attributes put attr1 after rm "/#attribute[1]";
set "/#attribute/attr2" "foo" = attr2
let empty1 = ""
let empty2 = ""
let empty3 = "\n"
let empty4 = ""
test Xml.empty_element get empty1 = { "a" = "#empty" }
test Xml.empty_element get empty2 =
{ "a" = "#empty" { "#attribute" { "foo" = "bar"} } }
test Xml.empty_element put empty1 after set "/a/#attribute/foo" "bar" = empty2
(* the attribute node must be the first child of the element *)
test Xml.empty_element put empty1 after set "/a/#attribute/foo" "bar";
set "/a/#attribute/far" "baz" = empty4
test Xml.content put "" after clear "/a/b" = "\n"
test Xml.lns put "" after set "/a/#text[1]" "foo";
set "/a/#text[2]" "bar" = "foobar"
test Xml.lns get "
" =
{ "#declaration"
{ "#attribute"
{ "version" = "1.0" }
}
}
{ "!DOCTYPE" = "catalog"
{ "PUBLIC"
{ "#literal" = "-//OASIS//DTD XML Catalogs V1.0//EN" }
{ "#literal" = "file:///usr/share/xml/schema/xml-core/catalog.dtd" }
}
}
{ "doc" = "#empty" }
test Xml.lns get "
" =
{ "oor:component-data" = "#empty"
{ "#attribute"
{ "xmlns:oor" = "http://openoffice.org/2001/registry" }
}
}
let input1 = "
Wiki
Augeas
Augeas is now able to parse XML files!
- Translate from XML to a tree syntax
- Translate from the tree back to XML
- this
"
test Xml.doc get input1 =
{ "#declaration"
{ "#attribute"
{ "version" = "1.0" }
{ "encoding" = "UTF-8" }
}
}
{ "html"
{ "#text" = "\n " }
{ "head"
{ "#text" = "\n " }
{ "title"
{ "#text" = "Wiki" }
}
{ "#text" = " " }
}
{ "#text" = " " }
{ "body"
{ "#text" = "
" }
{ "h1"
{ "#text" = "Augeas" }
}
{ "#text" = " " }
{ "p"
{ "#attribute"
{ "class" = "main" }
}
{ "#text" = "Augeas is now able to parse XML files!" }
}
{ "#text" = " " }
{ "ul"
{ "#text" = "\n " }
{ "li"
{ "#text" = "Translate from XML to a tree syntax" }
}
{ "#text" = " " }
{ "li"
{ "#text" = "Translate from the tree back to XML" }
}
{ "#text" = " " }
{ "#comment" = " this is some comment " }
{ "#text" = "
" }
{ "li"
{ "#text" = "this" }
}
{ "#text" = " " }
}
{ "#text" = " " }
}
}
test Xml.doc put input1 after rm "/html/body" =
"
Wiki
"
let ul1 = "
"
test Xml.doc get ul1 =
{ "ul"
{ "#text" = "
" }
{ "li"
{ "#text" = "test1" }
}
{ "#text" = " " }
{ "li"
{ "#text" = "test2" }
}
{ "#text" = " " }
{ "li"
{ "#text" = "test3" }
}
{ "#text" = " " }
{ "li"
{ "#text" = "test4" }
}
}
test Xml.doc put ul1 after set "/ul/li[3]/#text" "bidon" = "
"
test Xml.doc put ul1 after rm "/ul/li[2]" = "
"
(* #text nodes don't move when inserting a node, the result depends on where the node is added *)
test Xml.doc put ul1 after insb "a" "/ul/li[2]" = "
"
test Xml.doc put ul1 after insa "a" "/ul/li[1]" = "
"
(* Attributes must be added before text nodes *)
test Xml.doc put ul1 after insb "#attribute" "/ul/li[2]/#text";
set "/ul/li[2]/#attribute/bidon" "gazou";
set "/ul/li[2]/#attribute/foo" "bar" = "
"
(* if empty element is allowed to be as root, this test triggers error *)
test Xml.lns get "
" =
{ "doc"
{ "#text" = "\n" }
{ "a"
{ "c" = "#empty" }
{ "b"
{ "c" = "#empty" }
}
{ "c" = "#empty" }
{ "c" = "#empty" }
{ "a" }
}
}
let p01pass2 = "
]>
"
test Xml.lns get p01pass2 =
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "before document element" }
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "before document element" }
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "before document element" }
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "before document element" }
}
{ "!DOCTYPE" = "doc"
{ "!ELEMENT" = "doc"
{ "#decl" = "ANY" }
}
{ "!ELEMENT" = "a"
{ "#decl" = "ANY" }
}
{ "!ELEMENT" = "b"
{ "#decl" = "ANY" }
}
{ "!ELEMENT" = "c"
{ "#decl" = "ANY" }
}
}
{ "doc"
{ "#text" = "
" }
{ "a"
{ "b"
{ "c" = "#empty" }
}
}
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "after document element" }
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "after document element" }
}
{ "#comment" = " comment after document element" }
{ "#pi"
{ "#target" = "PI" }
{ "#instruction" = "after document element" }
}
(* various valid Name constructions *)
test Xml.lns get "\n\n<::._-0/>\n<_:._-0/>\n\n<_/>\n<:/>\n" =
{ "doc"
{ "#text" = "\n" }
{ "A:._-0" = "#empty" }
{ "::._-0" = "#empty" }
{ "_:._-0" = "#empty" }
{ "A" = "#empty" }
{ "_" = "#empty" }
{ ":" = "#empty" }
}
test Xml.lns get "
" =
{ "doc"
{ "#text" = "\n" }
{ "abcdefghijklmnopqrstuvwxyz" = "#empty" }
{ "ABCDEFGHIJKLMNOPQRSTUVWXYZ" = "#empty" }
{ "A01234567890" = "#empty" }
{ "A.-:" = "#empty" }
}
let p06fail1 = "
]>
"
(* we accept this test because we do not verify XML references *)
test Xml.lns get p06fail1 =
{ "#comment" = "non-validating processors may pass this instance because they don't check the IDREFS attribute type" }
{ "!DOCTYPE" = "doc"
{ "!ELEMENT" = "doc"
{ "#decl" = "(a|refs)*" }
}
{ "!ELEMENT" = "a"
{ "#decl" = "EMPTY" }
}
{ "!ELEMENT" = "refs"
{ "#decl" = "EMPTY" }
}
{ "!ATTLIST" = "refs"
{ "1"
{ "#name" = "refs" }
{ "#type" = "IDREFS" }
{ "#REQUIRED" }
}
}
{ "!ATTLIST" = "a"
{ "1"
{ "#name" = "id" }
{ "#type" = "ID" }
{ "#REQUIRED" }
}
}
}
{ "doc"
{ "#text" = "
" }
{ "a" = "#empty"
{ "#attribute"
{ "id" = "A1" }
}
}
{ "a" = "#empty"
{ "#attribute"
{ "id" = "A2" }
}
}
{ "a" = "#empty"
{ "#attribute"
{ "id" = "A3" }
}
}
{ "refs" = "#empty"
{ "#attribute"
{ "refs" = "" }
}
}
}
(* we accept dquote, but not single quotes, because of resulting ambiguity *)
let p10pass1_1 = "'">\nasdf\n ?>%\"/>"
let p10pass1_2 = ""
test Xml.lns get p10pass1_1 =
{ "doc"
{ "A" = "#empty"
{ "#attribute"
{ "a" = "asdf>'">\nasdf\n ?>%" }
}
}
}
test Xml.lns get p10pass1_2 = *
(* here again, test exclude single quote *)
let p11pass1 = "
?>/\''\">
]>
"
test Xml.lns get p11pass1 =
{ "#comment" = "Inability to resolve a notation should not be reported as an error" }
{ "!DOCTYPE" = "doc"
{ "!ELEMENT" = "doc"
{ "#decl" = "EMPTY" }
}
{ "!NOTATION" = "not1"
{ "SYSTEM" = "a%a&b?>/\''" }
}
{ "!NOTATION" = "not3"
{ "SYSTEM" = "" }
}
}
{ "doc" }
test Xml.lns get "a%b%</doc></doc>]]<&" =
{ "doc"
{ "#text" = "a%b%</doc></doc>]]<&" }
}
let p15pass1 = "
"
test Xml.lns get p15pass1 =
{ "#comment" = "a
-<[ CDATA [
\"- -'-
-" }
{ "#comment" = "" }
{ "doc" }
let p22pass3 = "
"
test Xml.lns get p22pass3 =
{ "#declaration"
{ "#attribute"
{ "version" = "1.0" }
}
}
{ "#comment" = "comment" }
{ "#pi"
{ "#target" = "pi" }
{ "#instruction" = "some instruction" }
}
{ "doc"
{ "#pi"
{ "#target" = "pi" }
}
}
let p25pass2 = "
"
test Xml.lns get p25pass2 =
{ "#declaration"
{ "#attribute"
{ "version" = "1.0" }
}
}
{ "doc" }
test Xml.lns get "
]>
" =
{ "!DOCTYPE" = "doc"
{ "!ELEMENT" = "doc"
{ "#decl" = "EMPTY" }
}
}
{ "doc" }
test Xml.lns get "" = { "doc" }
test Xml.lns get "" =
{ "a"
{ "doc" = "#empty"
{ "#attribute"
{ "att" = "val" }
{ "att2" = "val2" }
{ "att3" = "val3" }
}
}
}
test Xml.lns get "" = { "doc" = "#empty" }
(* failure tests *)
(* only one document element *)
test Xml.lns get "" = *
(* document element must be complete *)
test Xml.lns get "" = *
(* emtpy document is rejected *)
test Xml.lns get "" = *
(* malformed element *)
test Xml.lns get "" = *
(* a Name cannot start with a digit *)
test Xml.lns get "<0A/>" = *
(* no space before "CDATA" *)
test Xml.lns get "" = *
(* no space after "CDATA" *)
test Xml.lns get "" = *
(* CDSect's can't nest *)
test Xml.lns get "
]]>
" = *
(* Comment is illegal in VersionInfo *)
test Xml.lns get " =\"1.0\"?>
" = *
(* only declarations in DTD *)
test Xml.lns get "
]>" = *
(* we do not support external entities *)
test Xml.lns get "\">
%eldecl;
]>
" = *