File: example.dtd

package info (click to toggle)
gocr 0.52-6.1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,864 kB
  • sloc: ansic: 18,197; sh: 545; makefile: 339; xml: 20
file content (53 lines) | stat: -rw-r--r-- 1,704 bytes parent folder | download | duplicates (9)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
<?xml version="1.0" encoding="UTF-8"?>
<!-- The text declaration of an external DTD subset must include an encoding
     declaration; the version alone is only sufficient in a document entity. -->
<!--
    first draft by Volker Simonis, reviewed by Joerg Schulenburg
                 It's not ready for use!
     ToDo:
       - lynx/links/w3c should show xml like an html file
           value as <character ...>CharText</character>
           or  <word><character ...></character><...>WordText</word>
           or as line or as block? what's more useful?
       - how to code table of alternative chars/words and their probabilities?
       - how to handle images (as image tags?)
       - xmllint -\-htmlout -\-loaddtd jocr/doc/example.dtd o.xml
  -->
<!-- Parameter entity holding the attribute definitions shared by every
     element in this DTD: x, y, dx and dy, each a required CDATA attribute.
     It is expanded inside the ATTLIST declarations via %default.attributes;
     NOTE(review): presumably x/y are a position and dx/dy an extent of the
     element on the scanned image; confirm against the program's XML output. -->
<!ENTITY % default.attributes "x  CDATA #REQUIRED
                               y  CDATA #REQUIRED
                               dx CDATA #REQUIRED
                               dy CDATA #REQUIRED">

<!-- box: empty element carrying the shared x, y, dx, dy attributes plus a
     required value attribute. An attribute definition ends at its default
     declaration, so no ';' may follow #REQUIRED. -->
<!ELEMENT box EMPTY>
<!ATTLIST box
          %default.attributes;
          value CDATA #REQUIRED>

<!-- barcode: empty element carrying the shared x, y, dx, dy attributes plus a
     required value attribute. An attribute definition ends at its default
     declaration, so no ';' may follow #REQUIRED. -->
<!ELEMENT barcode EMPTY>
<!ATTLIST barcode
          %default.attributes;
          value CDATA #REQUIRED>

<!-- img: empty element whose only attributes are the shared
     x, y, dx, dy set. -->
<!ELEMENT img EMPTY>
<!ATTLIST img
          %default.attributes;>

<!-- page: contains zero or more block children and carries the shared
     x, y, dx, dy attributes. -->
<!ELEMENT page (block)*>
<!ATTLIST page
          %default.attributes;>

<!-- block: contains zero or more line children and carries the shared
     x, y, dx, dy attributes. -->
<!ELEMENT block (line)*>
<!ATTLIST block
          %default.attributes;>

<!-- line: any sequence, in any order and possibly empty, of word, space and
     punctuation-mark children; carries the shared x, y, dx, dy attributes. -->
<!ELEMENT line (word | space | punctuation-mark)*>
<!ATTLIST line
          %default.attributes;>

<!-- word: contains zero or more char children and carries the shared
     x, y, dx, dy attributes. The content model names char because that is
     the element this DTD declares; no element called "character" is
     declared, so a word with children could never validate against it. -->
<!ELEMENT word (char*)>
<!ATTLIST word
          %default.attributes;>

<!-- char: empty element carrying the shared x, y, dx, dy attributes plus a
     required value attribute.
     A "(#CDATA)" token is not valid inside an ATTLIST, and no ';' may follow
     #REQUIRED. If the character text should instead be element content,
     the element declaration would have to be (#PCDATA) rather than EMPTY;
     the declaration is kept EMPTY here, with the text in the value attribute. -->
<!ELEMENT char EMPTY>
<!ATTLIST char
          %default.attributes;
          value CDATA #REQUIRED>

<!-- space: empty element carrying the shared x, y, dx, dy attributes plus a
     required value attribute. An attribute definition ends at its default
     declaration, so no ';' may follow #REQUIRED. -->
<!ELEMENT space EMPTY>
<!ATTLIST space
          %default.attributes;
          value CDATA #REQUIRED>

<!-- punctuation-mark: empty element carrying the shared x, y, dx, dy
     attributes plus a required value attribute. An attribute definition ends
     at its default declaration, so no ';' may follow #REQUIRED. -->
<!ELEMENT punctuation-mark EMPTY>
<!ATTLIST punctuation-mark
          %default.attributes;
          value CDATA #REQUIRED>