File: html_lexer-basic.ads

package info (click to toggle)
libopentoken 3.0b-5
  • links: PTS
  • area: main
  • in suites: etch, etch-m68k
  • size: 1,416 kB
  • ctags: 51
  • sloc: ada: 8,561; makefile: 120
file content (106 lines) | stat: -rw-r--r-- 5,307 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
-------------------------------------------------------------------------------
--
-- Copyright (C) 1999 Christoph Karl Walter Grein
--
-- This file is part of the OpenToken package.
--
-- The OpenToken package is free software; you can redistribute it and/or
-- modify it under the terms of the  GNU General Public License as published
-- by the Free Software Foundation; either version 2, or (at your option)
-- any later version. The OpenToken package is distributed in the hope that
-- it will be useful, but WITHOUT ANY WARRANTY; without even the implied
-- warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-- GNU General Public License for  more details.  You should have received
-- a copy of the GNU General Public License  distributed with the OpenToken
-- package;  see file GPL.txt.  If not, write to  the Free Software Foundation,
-- 59 Temple Place - Suite 330,  Boston, MA 02111-1307, USA.
--
-- As a special exception,  if other files  instantiate  generics from this
-- unit, or you link this unit with other files to produce an executable,
-- this unit does not by itself cause the resulting executable to be
-- covered by the GNU General Public License.  This exception does not
-- however invalidate any other reasons why the executable file might be
-- covered by the GNU Public License.
--
-- Maintainer: Christoph K. W. Grein (Christ-Usch.Grein@T-Online.de)
--
-- Update History:
-- $Log: html_lexer-basic.ads,v $
-- Revision 1.3  2000/08/07 00:21:17  Ted
-- Change to work w/ new package hierarchy
--
-- Revision 1.2  2000/01/27 21:22:35  Ted
-- Fix to work with 2.0 release
--
-- Revision 1.1  1999/12/27 21:41:56  Ted
-- Merged into OpenToken baseline
--
-- Revision 1.0  1999/12/21  Grein
-- Initial Version
--
-------------------------------------------------------------------------------

with Ada.Strings.Maps.Constants;

with OpenToken.Token.Enumerated.Analyzer;

with OpenToken.Recognizer.Bracketed_Comment;
with OpenToken.Recognizer.Character_Set;
with OpenToken.Recognizer.End_Of_File;
with OpenToken.Recognizer.HTML_Entity;
with OpenToken.Recognizer.Identifier;
with OpenToken.Recognizer.Nothing;

pragma Elaborate_All (OpenToken.Recognizer.Bracketed_Comment, OpenToken.Recognizer.Character_Set,
                      OpenToken.Recognizer.End_Of_File, OpenToken.Recognizer.HTML_Entity,
                      OpenToken.Recognizer.Identifier, OpenToken.Recognizer.Nothing);

private package HTML_Lexer.Basic is

   -- Token kinds produced by the basic (first-stage) HTML tokenizer.
   --
   -- The order of the literals is significant: when several tokens
   -- compete for the same input, the one declared first wins.
   type Basic_Token is
     (Whitespace,
      Comment,       -- comments:                  <!-- anything -->
      Doctype,       -- document type declaration: <!DOCTYPE ... >
      HTML_Tag,      -- HTML tags such as <A> or </A>
      Text,          -- running text
      Entity,        -- entities such as &amp;
      Bad_Token,     -- syntax error
      End_Of_File);

   -- Token family and analyzer instantiated for Basic_Token.
   package Master_Basic_Token is new OpenToken.Token.Enumerated (Basic_Token);
   package Tokenizer          is new Master_Basic_Token.Analyzer;

   -- Gives direct visibility of "-" on character sets, which the Text
   -- entry of the syntax table uses.
   use type Ada.Strings.Maps.Character_Set;

   -- One recognizer per token kind, listed in the declaration order of
   -- Basic_Token.  The associations are named, so the order in which
   -- they are written here carries no meaning of its own.
   Syntax : constant Tokenizer.Syntax :=
     (Whitespace =>
        -- No Reportable argument is given here, so the recognizer's own
        -- default applies.
        Tokenizer.Get
          (OpenToken.Recognizer.Character_Set.Get
             (OpenToken.Recognizer.Character_Set.Standard_Whitespace)),

      Comment =>
        Tokenizer.Get
          (OpenToken.Recognizer.Bracketed_Comment.Get
             (Comment_Opener => "<!--",
              Comment_Closer => "-->",
              Reportable     => True)),

      Doctype =>
        -- Shares the "<!" prefix with Comment.
        Tokenizer.Get
          (OpenToken.Recognizer.Bracketed_Comment.Get
             (Comment_Opener => "<!",
              Comment_Closer => ">",
              Reportable     => True)),

      HTML_Tag =>
        -- Shares the "<" prefix with Comment and Doctype.
        Tokenizer.Get
          (OpenToken.Recognizer.Bracketed_Comment.Get
             (Comment_Opener => "<",
              Comment_Closer => ">",
              Reportable     => True)),

      Text =>
        -- Every graphic character except '<', '>', '"' and '&'.
        -- NOTE(review): the double quote is excluded along with the
        -- markup characters; confirm that this is intended.
        Tokenizer.Get
          (OpenToken.Recognizer.Character_Set.Get
             (Ada.Strings.Maps.Constants.Graphic_Set
                - Ada.Strings.Maps.To_Set ("<>""&"),
              Reportable => True)),

      Entity =>
        Tokenizer.Get (OpenToken.Recognizer.HTML_Entity.Get),

      Bad_Token =>
        Tokenizer.Get (OpenToken.Recognizer.Nothing.Get),

      End_Of_File =>
        Tokenizer.Get (OpenToken.Recognizer.End_Of_File.Get));

   -- The analyzer object built from the syntax table above; Bad_Token is
   -- supplied as its default token.
   Analyzer : Tokenizer.Instance :=
     Tokenizer.Initialize (Syntax, Default => Bad_Token);

end HTML_Lexer.Basic;