docs/bib-ref2

view stuff/wordfreq @ 60:ab0bbc4264e3

PB: added an abstract
author markus schnalke <meillo@marmaro.de>
date Wed, 05 Nov 2014 07:37:06 +0100
parents
children
line source
#!/bin/sh
#
# print word frequency
#
# Usage: wordfreq [file...]
#
# The given files (or stdin when no file is named) are passed through
# deroff(1); the remaining text is split into words, folded to lower
# case and counted.  One line is printed per distinct word:
#
#     word <TAB> share of all words (two decimals) <TAB> count
#
# Lines are ordered by count, most frequent word first.
#
# A word is a run of ASCII letters, German umlauts/eszett and hyphens;
# every other character acts as a separator.
#
# NOTE(review): tr implementations differ in how they treat multibyte
# characters inside sets and ranges -- confirm that the umlaut handling
# works with the tr(1) and locale in use.

wordfreq() {
	deroff "$@" |
	tr -c 'A-Za-zÄÖÜäöüß-' '\n' |
	tr 'A-ZÄÖÜ' 'a-zäöü' |
	awk '
		# Runs of separators leave empty lines behind; they are not words.
		$0 == "" { next }

		# Each remaining line holds exactly one word.
		{ count[$0]++; total++ }

		END {
			for (word in count)
				printf("%s\t%.2f\t%4d\n", word, count[word]/total, count[word])
		}
	' |
	# awk emits the words in unspecified order: sort numerically on the
	# count column, largest first.
	sort -nr -k 3
}

wordfreq "$@"