pdftotext "$1" - \ | perl -CS -ne 'while (/(\p{L}+(?:-\p{L}+)*)/g) { print lc($1), "\n"; }' \ | awk 'length($0) >= 3' \ | sort \ | uniq -c \ | sort -nr