File: isub.pl

package info (click to toggle)
swi-prolog 7.2.3%2Bdfsg-6
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 84,180 kB
  • ctags: 45,684
  • sloc: ansic: 330,358; perl: 268,104; sh: 6,795; java: 4,904; makefile: 4,561; cpp: 4,153; ruby: 1,594; yacc: 843; xml: 82; sed: 12; sql: 6
file content (67 lines) | stat: -rw-r--r-- 2,493 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
/*  Part of SWI-Prolog

    Author:        Giorgos Stoilos and Jan Wielemaker

    This program is free software; you can redistribute it and/or
    modify it under the terms of the GNU General Public License
    as published by the Free Software Foundation; either version 2
    of the License, or (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public
    License along with this library; if not, write to the Free Software
    Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA

    As a special exception, if you link this library with other files,
    compiled with a Free Software compiler, to produce an executable, this
    library does not by itself cause the resulting executable to be covered
    by the GNU General Public License. This exception does not however
    invalidate any other reasons why the executable file might be covered by
    the GNU General Public License.
*/

:- module(isub,
	  [ isub/4			% +Text1, +Text2, +Normalize, -Similarity
	  ]).

:- use_foreign_library(foreign(isub)).

/** <module> isub: a string similarity measure

The library(isub) implements a similarity measure between strings, i.e.,
something similar to the _|Levenshtein distance|_.  This method is based
on the length of common substrings.

@author Giorgos Stoilos
@see	_|A string metric for ontology alignment|_ by Giorgos Stoilos,
	2005.
*/

%%	isub(+Text1:atomic, +Text2:atomic, +Normalize:bool,
%%	     -Similarity:float) is det.
%
%	Similarity is a measure of how similar Text1 and Text2 are
%	(not a distance: a higher value means more similar).  E.g.
%
%	  ==
%	  ?- isub('E56.Language', 'languange', true, D).
%	  D = 0.711348.
%	  ==
%
%	If Normalize is =true=, isub/4   applies string normalization as
%	implemented by the original authors: Text1  and Text2 are mapped
%	to lowercase and the characters ".", "_" and " " are removed. Lowercase
%	mapping is done  with  the   C-library  function  towlower(). In
%	general, the required normalization is   domain dependent and is
%	better left to the caller.  See e.g., unaccent_atom/2.
%
%	@param	Similarity is a float in the range [0.0..1.0], where 1.0
%		means _|most similar|_

% Hook into library(sandbox): add a safe_primitive/1 clause for isub/4.
% The clause is added to a predicate owned by module `sandbox`, hence the
% multifile declaration.
% NOTE(review): this presumes the foreign implementation of isub/4 has no
% unsafe side effects -- confirm against the C source.

:- multifile sandbox:safe_primitive/1.

sandbox:safe_primitive(isub:isub(_,_,_,_)).