File: dupword.awk

package info (click to toggle)
gawk 1:4.1.1+dfsg-1
  • links: PTS
  • area: main
  • in suites: jessie, jessie-kfreebsd
  • size: 15,604 kB
  • ctags: 5,728
  • sloc: ansic: 47,935; sh: 12,995; awk: 10,263; yacc: 5,815; makefile: 2,279; sed: 121
file content (21 lines) | stat: -rw-r--r-- 507 bytes parent folder | download | duplicates (8)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# dupword.awk --- find duplicate words in text
#
# Arnold Robbins, arnold@skeeve.com, Public Domain
# December 1991
# Revised October 2000

{
    $0 = tolower($0)
    gsub(/[^[:alnum:][:blank:]]/, " ");
    $0 = $0         # re-split
    if (NF == 0)
        next
    if ($1 == prev)
        printf("%s:%d: duplicate %s\n",
            FILENAME, FNR, $1)
    for (i = 2; i <= NF; i++)
        if ($i == $(i-1))
            printf("%s:%d: duplicate %s\n",
                FILENAME, FNR, $i)
    prev = $NF
}