File: dupword.awk

package info (click to toggle)
gawk 3.0.3-1
  • links: PTS
  • area: main
  • in suites: hamm, slink
  • size: 4,520 kB
  • ctags: 2,175
  • sloc: ansic: 20,481; awk: 2,476; yacc: 2,039; makefile: 877; sh: 409
file content (16 lines) | stat: -rw-r--r-- 414 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# dupword --- find duplicate words in text
# Arnold Robbins, arnold@gnu.ai.mit.edu, Public Domain
# December 1991

# Main rule, run for every input record: report any word that is
# immediately repeated, either within the line or across a line break
# (last word of the previous non-empty line vs. first word of this one).
# Output format: FILENAME:FNR: duplicate WORD
#
# `prev' holds the last word seen so far; it is never reset, so it
# persists across records and across input files.
{
    # Fold case so that "The the" is detected as a duplicate.
    $0 = tolower($0)

    # Drop everything except letters, digits, spaces and tabs.
    # Modifying $0 causes the record to be re-split into fields.
    gsub(/[^A-Za-z0-9 \t]/, "");

    # A blank or punctuation-only line has no words.  Without this guard
    # $1 and $NF are both "" and consecutive empty lines (or an empty
    # first line) would be reported as a duplicate of the empty word.
    # Skipping also leaves `prev' untouched, so a word repeated across
    # an empty line is still caught.
    if (NF == 0)
        next

    # First word of this line vs. last word of the previous line.
    if ($1 == prev)
        printf("%s:%d: duplicate %s\n",
            FILENAME, FNR, $1)

    # Adjacent words within this line.
    for (i = 2; i <= NF; i++)
        if ($i == $(i-1))
            printf("%s:%d: duplicate %s\n",
                FILENAME, FNR, $i)

    # Remember the last word for the next record's cross-line check.
    prev = $NF
}