#!/bin/bash
#
# Word-frequency filter built on MeCab.
#
# Reads UTF-8 text on stdin, passes it through `mecab`, takes the 7th
# comma-separated field of every token line and prints one
# "COUNT<TAB>WORD" line per distinct value, highest count first.
#
# Requires: iconv, mecab.
# NOTE(review): the EUC-JP round-trip suggests the installed MeCab
# dictionary is EUC-JP encoded, and with an IPA-style feature layout the
# 7th field is presumably the base form of the token -- confirm both for
# your installation.
#
# `set -e` / `pipefail` are deliberately not enabled: `iconv -c` may
# report a non-zero status after discarding unconvertible characters,
# and that best-effort conversion must not abort the run.

#######################################
# Tokenise stdin with MeCab and emit one word per line.
# Inputs:  UTF-8 text on stdin
# Outputs: field 7 (comma-separated) of every MeCab token line
#######################################
extract_base_forms() {
  # Only the sentence-end marker (a line that is exactly "EOS") and blank
  # lines are dropped; token lines that merely contain "EOS" are kept.
  # Token lines with fewer than seven fields yield an empty word.
  iconv -c -f UTF-8 -t EUCJP \
    | mecab \
    | iconv -c -f EUCJP -t UTF-8 \
    | awk -F ',' '$0 != "EOS" && $0 != "" { print $7 }'
}

#######################################
# Count identical lines and rank them by frequency.
# Inputs:  one word per line on stdin
# Outputs: "COUNT<TAB>WORD" lines, highest count first
#######################################
rank_words() {
  # A single pass records, for every distinct line, how often it occurs
  # and the line number of its first occurrence. Lines are compared as
  # literal whole strings, never as patterns or substrings.
  #
  # Records are COUNT<TAB>FIRST<TAB>WORD. Ties on COUNT are left to
  # sort's fallback comparison of the whole record, so FIRST takes part
  # in their ordering; it is removed again by cut (default delimiter:
  # TAB) before output.
  awk '
    !($0 in count) { first[$0] = NR }
    { count[$0]++ }
    END {
      for (word in count) {
        printf "%d\t%d\t%s\n", count[word], first[word], word
      }
    }
  ' \
    | sort -n -r \
    | cut -f1,3
}

#######################################
# Entry point: verify the external tools exist, then run the pipeline.
# Returns: 127 if a required command is missing, otherwise the status
#          of the ranking pipeline.
#######################################
main() {
  local tool
  for tool in iconv mecab; do
    if ! command -v "$tool" >/dev/null 2>&1; then
      printf '%s: required command not found: %s\n' "${0##*/}" "$tool" >&2
      return 127
    fi
  done

  extract_base_forms | rank_words
}

main "$@"