File: basic.punctuation.lexc

package info (click to toggle)
hfst 3.16.2-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 14,532 kB
  • sloc: cpp: 101,875; sh: 6,717; python: 5,225; yacc: 4,985; lex: 2,900; makefile: 2,017; xml: 6
file content (68 lines) | stat: -rw-r--r-- 1,396 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
! Ripped and simplified from North Sámi material: tests that the lexer eats
! punctuation properly.

! Declare +PUNCT as one multi-character symbol so that the tag is kept whole
! instead of being split into single characters.
Multichar_Symbols +PUNCT

! Root lexicon: one entry per punctuation mark. In each entry the upper side
! is the mark followed by the +PUNCT tag, the lower side is the bare mark,
! and the continuation is # (end of word).
! Multi-character marks such as .. ... §§ -- and +/- are not declared in
! Multichar_Symbols, so they are plain sequences of single characters.
LEXICON Root
,+PUNCT:,  # ;
.+PUNCT:.  # ;
..+PUNCT:..   # ;
...+PUNCT:...   # ;
?+PUNCT:?  # ; 
…+PUNCT:…  # ;
¿+PUNCT:¿  # ;
¶+PUNCT:¶  # ;
§+PUNCT:§  # ;
§§+PUNCT:§§ # ;
$+PUNCT:$  # ;
€+PUNCT:€  # ;
£+PUNCT:£  # ;
®+PUNCT:®  # ;
©+PUNCT:©  # ;

•+PUNCT:•  # ; !U+2022 Bullet
●+PUNCT:●  # ; !U+25CF Black circle
·+PUNCT:·  # ; !U+00B7 Middle dot
ּ+PUNCT:ּ   # ; !U+05BC Hebrew (sic!) middle dot (Unicode name: HEBREW POINT DAGESH OR MAPIQ, a combining mark)
·+PUNCT:·  # ; !U+0387, Greek (sic!) middle dot, or rather semicolon, in Greek (Unicode name: GREEK ANO TELEIA).
-+PUNCT:-  # ; !hyphen
--+PUNCT:--  # ; !double hyphen
–+PUNCT:–  # ; !endash
—+PUNCT:—  # ; !emdash
―+PUNCT:―  # ; !horizontal bar U+2015
=+PUNCT:=  # ;
≈+PUNCT:≈  # ;
&+PUNCT:&  # ;
'+PUNCT:'  # ;
*+PUNCT:*  # ;
++PUNCT:+  # ; !literal plus sign, followed by the +PUNCT tag
±+PUNCT:±  # ;
`+PUNCT:`  # ;
´+PUNCT:´  # ;
/+PUNCT:/  # ; 
+/-+PUNCT:+/- # ;
~+PUNCT:~	  # ;
«+PUNCT:«  # ;
»+PUNCT:»  # ;
“+PUNCT:“  # ;
”+PUNCT:”  # ;
‘+PUNCT:‘  # ;
’+PUNCT:’  # ;
„+PUNCT:„  # ;
‹+PUNCT:‹  # ;
›+PUNCT:›  # ;
(+PUNCT:(  # ;
)+PUNCT:)  # ;
[+PUNCT:[  # ;
]+PUNCT:]  # ;
{+PUNCT:{  # ;
}+PUNCT:}  # ;
! Escape required: the characters below have a special meaning in lexc
! syntax, so each one is written with a leading % to be taken literally.
%"+PUNCT:%"  # ;
%!+PUNCT:%!  # ;
%<+PUNCT:%<  # ;
%>+PUNCT:%>  # ;
%%+PUNCT:%%  # ;
%:+PUNCT:%:  # ;
%;+PUNCT:%;  # ;
%#+PUNCT:%#  # ;