File: html_chars.mll

package info (click to toggle)
hlins 0.40-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 484 kB
  • sloc: ml: 1,215; makefile: 148; sh: 4
file content (123 lines) | stat: -rw-r--r-- 4,335 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
(***************************************************************************)
(*  HLins: insert http-links into HTML documents.                          *)
(*  See http://www.lri.fr/~treinen/hlins                                   *)
(*                                                                         *)
(*  Copyright (C) 1999-2024 Ralf Treinen <treinen@irif.fr>                 *)
(*                                                                         *)
(*  This program is free software; you can redistribute it and/or modify   *)
(*  it under the terms of the GNU General Public License as published by   *)
(*  the Free Software Foundation; either version 2 of the License, or (at  *)
(*  your option) any later version.                                        *)
(*                                                                         *)
(*  This program is distributed in the hope that it will be useful, but    *)
(*  WITHOUT ANY WARRANTY; without even the implied warranty of             *)
(*  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU      *)
(*  General Public License for more details.                               *)
(*                                                                         *)
(*  You should have received a copy of the GNU General Public License      *)
(*  along with this program; if not, write to the Free Software            *)
(*  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307    *)
(*  USA                                                                    *)
(*                                                                         *)
(***************************************************************************)

(*
    HLins: insert http-links into HTML documents.
    See http://www.lri.fr/~treinen/hlins

    Copyright (C) 1999 Ralf Treinen <treinen@lri.fr>

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

*)

{
open Lexing;;

(* Decode a numeric HTML character reference of the form "&#nnn;" into the
   8-bit character whose code is nnn.  The three characters that follow the
   "&#" prefix (positions 2 to 4 of [s]) are read as a decimal number.
   [String.sub], [int_of_string] and [Char.chr] raise their usual exceptions
   if [s] is too short, is not numeric at those positions, or denotes a
   code outside 0..255.
*)
let special_to_char s =
  let digits = String.sub s 2 3 in
  let code = int_of_string digits in
  Char.chr code
;;

}


(* [next_char lexbuf] consumes one logical character from [lexbuf] and
   returns it as an 8-bit (ISO-8859-1) char:
   - a named HTML entity for a Latin-1 letter (codes 192..255) is decoded
     to that letter;
   - a numeric reference "&#nnn;" with nnn in 192..255 is decoded through
     [special_to_char];
   - any other input character is returned unchanged, one at a time (so an
     unrecognised entity comes back character by character, starting
     with '&');
   - at end of input, [End_of_file] is raised.

   The results are written as decimal escapes rather than raw Latin-1
   bytes so that this file stays pure ASCII and survives re-encoding.
*)
rule next_char = parse
  | "&Agrave;"    { '\192' }
  | "&Aacute;"    { '\193' }
  | "&Acirc;"     { '\194' }
  | "&Atilde;"    { '\195' }
  | "&Auml;"      { '\196' }
  | "&Aring;"     { '\197' }
  | "&AElig;"     { '\198' }
  | "&Ccedil;"    { '\199' }
  | "&Egrave;"    { '\200' }
  | "&Eacute;"    { '\201' }
  | "&Ecirc;"     { '\202' }
  | "&Euml;"      { '\203' }
  | "&Igrave;"    { '\204' }
  | "&Iacute;"    { '\205' }
  | "&Icirc;"     { '\206' }
  | "&Iuml;"      { '\207' }
  | "&ETH;"       { '\208' }
  | "&Ntilde;"    { '\209' }
  | "&Ograve;"    { '\210' }
  | "&Oacute;"    { '\211' }
  | "&Ocirc;"     { '\212' }
  | "&Otilde;"    { '\213' }
  | "&Ouml;"      { '\214' }
      (* 215 is the multiplication sign, not a letter: no named entity here *)
  | "&Oslash;"    { '\216' }
  | "&Ugrave;"    { '\217' }
  | "&Uacute;"    { '\218' }
  | "&Ucirc;"     { '\219' }
  | "&Uuml;"      { '\220' }
  | "&Yacute;"    { '\221' }
  | "&THORN;"     { '\222' }
  | "&szlig;"     { '\223' }
  | "&agrave;"    { '\224' }
  | "&aacute;"    { '\225' }
  | "&acirc;"     { '\226' }
  | "&atilde;"    { '\227' }
  | "&auml;"      { '\228' }
  | "&aring;"     { '\229' }
  | "&aelig;"     { '\230' }
  | "&ccedil;"    { '\231' }
      (* historic misspelling of "&ccedil;", kept so that input accepted by
         earlier versions is still decoded the same way *)
  | "&ccdil;"     { '\231' }
  | "&egrave;"    { '\232' }
  | "&eacute;"    { '\233' }
  | "&ecirc;"     { '\234' }
  | "&euml;"      { '\235' }
  | "&igrave;"    { '\236' }
  | "&iacute;"    { '\237' }
  | "&icirc;"     { '\238' }
  | "&iuml;"      { '\239' }
  | "&eth;"       { '\240' }
  | "&ntilde;"    { '\241' }
  | "&ograve;"    { '\242' }
  | "&oacute;"    { '\243' }
  | "&ocirc;"     { '\244' }
  | "&otilde;"    { '\245' }
  | "&ouml;"      { '\246' }
      (* 247 is the division sign, not a letter: no named entity here *)
  | "&oslash;"    { '\248' }
  | "&ugrave;"    { '\249' }
  | "&uacute;"    { '\250' }
  | "&ucirc;"     { '\251' }
  | "&uuml;"      { '\252' }
  | "&yacute;"    { '\253' }
  | "&thorn;"     { '\254' }
  | "&yuml;"      { '\255' }
      (* special characters between 192 and 255, given numerically; the
         pattern always matches exactly three digits, which is what
         special_to_char expects *)
  | "&#" ( "19"['2'-'9'] | '2'['0'-'4']['0'-'9'] | "25"['0'-'5'] ) ";"
      { special_to_char (lexeme lexbuf) }
  |  eof          { raise End_of_file }
      (* anything else: hand back the single matched character as is *)
  | _             { lexeme_char lexbuf 0 }