summaryrefslogtreecommitdiff
path: root/utils/pdf2xml.dtd
blob: bf7f14f6cd9b1729beaacadcdcd8eecb0be991fe (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
<?xml version="1.0" encoding="UTF-8"?>
<!-- Document container. Content is one or more page elements, optionally
     followed by a single outline element. No other declaration in this
     file lists pdf2xml as a child. Both attributes are mandatory and are
     typed as free-form CDATA. -->
<!ELEMENT pdf2xml (page+, outline?)>
<!ATTLIST pdf2xml
          version  CDATA #REQUIRED
          producer CDATA #REQUIRED>
<!-- One page. Children must appear in a fixed order: all fontspec elements
     first, then all image elements, then all text elements. Each of the
     three groups may be empty. All six attributes are required; they are
     declared as CDATA, so the DTD does not constrain their values. -->
<!ELEMENT page (fontspec*, image*, text*)>
<!ATTLIST page
          number   CDATA #REQUIRED
          position CDATA #REQUIRED
          top      CDATA #REQUIRED
          left     CDATA #REQUIRED
          width    CDATA #REQUIRED
          height   CDATA #REQUIRED>
<!-- Font description. The element is always empty; all information is in
     its four required attributes.
     NOTE(review): the font attribute of text presumably refers to the id
     declared here, but both are plain CDATA, so a validating parser does
     not check that link. Confirm against the producer. -->
<!ELEMENT fontspec EMPTY>
<!ATTLIST fontspec
          id     CDATA #REQUIRED
          size   CDATA #REQUIRED
          family CDATA #REQUIRED
          color  CDATA #REQUIRED>
<!-- A run of text. Mixed content: character data freely interleaved with
     b, i and a child elements, in any order and any number. The four
     geometry attributes and the font attribute are all required. -->
<!ELEMENT text (#PCDATA | b | i | a)*>
<!ATTLIST text
          top    CDATA #REQUIRED
          left   CDATA #REQUIRED
          width  CDATA #REQUIRED
          height CDATA #REQUIRED
          font   CDATA #REQUIRED>
<!-- Inline markup allowed inside text (presumably bold and italic, going
     by the HTML-style names). Each may hold character data and the other
     element, so b and i can nest in either order. Neither may contain a. -->
<!ELEMENT b (#PCDATA | i)*>
<!ELEMENT i (#PCDATA | b)*>
<!-- Link inside text. Content is character data only; the href attribute
     is mandatory.
     NOTE(review): b and i are not permitted inside a. Confirm the producer
     never emits styled text within a link, otherwise such output would
     fail validation against this declaration. -->
<!ELEMENT a (#PCDATA)>
<!ATTLIST a
          href CDATA #REQUIRED>
<!-- Image placed on a page. Always empty; described entirely by its four
     required geometry attributes plus the required src attribute. All are
     CDATA, so the form of src (path, URL, ...) is not constrained here. -->
<!ELEMENT image EMPTY>
<!ATTLIST image
          top    CDATA #REQUIRED
          left   CDATA #REQUIRED
          width  CDATA #REQUIRED
          height CDATA #REQUIRED
          src    CDATA #REQUIRED>
<!-- Outline tree. Holds any number of item and nested outline elements in
     any order; an empty outline is also valid. Nesting depth is unbounded
     because outline may contain itself. -->
<!ELEMENT outline (item | outline)*>
<!-- Single outline entry. Content is character data only. The page
     attribute is optional (#IMPLIED), so an item may omit it. -->
<!ELEMENT item (#PCDATA)>
<!ATTLIST item
          page CDATA #IMPLIED>