File: htmlscan.mli

package info (click to toggle)
spamoracle 1.4-12
  • links: PTS, VCS
  • area: main
  • in suites: lenny
  • size: 256 kB
  • ctags: 245
  • sloc: ml: 1,198; makefile: 145; sh: 74
file content (18 lines) | stat: -rw-r--r-- 1,035 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
(***********************************************************************)
(*                                                                     *)
(*                 SpamOracle -- a Bayesian spam filter                *)
(*                                                                     *)
(*            Xavier Leroy, projet Cristal, INRIA Rocquencourt         *)
(*                                                                     *)
(*  Copyright 2002 Institut National de Recherche en Informatique et   *)
(*  en Automatique.  This file is distributed under the terms of the   *)
(*  GNU Public License version 2, http://www.gnu.org/licenses/gpl.txt  *)
(*                                                                     *)
(***********************************************************************)

(* $Id: htmlscan.mli,v 1.1 2003/01/02 08:52:15 xleroy Exp $ *)

(** Approximate HTML scanner.  Extracts words and certain parameters
    of certain tags (e.g. URLs) from HTML text. *)

(** [extract_text s] takes a string [s] and returns a string.

    NOTE(review): going by this module's header comment, [s] is presumably
    HTML text and the result presumably carries the words found in it
    together with selected tag parameters (e.g. URLs).  The exact layout of
    the returned string, how malformed markup is treated, and whether any
    exception can be raised are determined by the implementation, which is
    not visible from this interface -- confirm there before relying on
    them. *)
val extract_text: string -> string