diff options
Diffstat (limited to 'awklib/eg/prog/wordfreq.awk')
-rw-r--r-- | awklib/eg/prog/wordfreq.awk | 13 |
1 files changed, 13 insertions, 0 deletions
# wordfreq.awk --- print list of word frequencies
#
# (awklib/eg/prog/wordfreq.awk)
#
# For every input record, fold the text to lower case, strip every
# character that is not a lower-case letter, digit, underscore, space
# or tab, and count each remaining field as one occurrence of a word.
# At end of input, write one "word<TAB>count" line per distinct word
# through sort(1), ordered by count, highest first.

{
    $0 = tolower($0)                  # remove case distinctions
    gsub(/[^a-z0-9_ \t]/, "", $0)     # remove punctuation
    # Assigning to $0 re-splits the record, so NF and $i below reflect
    # the cleaned-up text, not the original line.
    for (i = 1; i <= NF; i++)
        freq[$i]++
}

END {
    # Sort numerically, in reverse, on the second field (the count).
    # The "-k" key syntax is used instead of the obsolescent "+1" form,
    # which POSIX-conforming sort implementations no longer accept
    # (they treat "+1" as a file name).
    sort = "sort -k 2nr"
    for (word in freq)
        printf "%s\t%d\n", word, freq[word] | sort
    # Close the pipe so sort sees end-of-file and emits its output
    # before awk exits.
    close(sort)
}