freebsd-skq/contrib/awk/test/longwrds.awk
1997-10-14 18:17:11 +00:00

21 lines
455 B
Awk

# From Gawk Manual modified by bug fix and removal of punctuation
# Record every word which is used at least once
{
for (i = 1; i <= NF; i++) {
tmp = tolower($i)
if (0 != (pos = match(tmp, /([a-z]|-)+/)))
used[substr(tmp, pos, RLENGTH)] = 1
}
}
#Find a number of distinct words longer than 10 characters
END {
num_long_words = 0
for (x in used)
if (length(x) > 10) {
++num_long_words
print x
}
print num_long_words, "long words"
}