script: ignore stop words in top_words

This commit is contained in:
MorganGeek
2018-09-07 12:25:33 +02:00
parent f4da6da8df
commit 1c28474769
2 changed files with 321 additions and 1 deletion

View File

@@ -1,3 +1,3 @@
#!/usr/bin/env bash
#
# Print word-frequency tables for the README.md that sits next to this script.
#
# Two tables are written to stdout, one after the other:
#   1. every word found in the README;
#   2. the same words minus those listed in stopwords.txt.
# A "word" is a run of three or more letters (a-z, A-Z), folded to lower case.
# Each table is ordered by ascending count, so the most frequent words are last.
#
# NOTE(review): the first, unfiltered table may be a leftover from before
# stop-word filtering was introduced - confirm it is still wanted.

# Directory holding this script. Both input files are looked up here so the
# script gives the same result whatever the caller's current directory is.
BASEDIR=$(dirname "$0")

# word_list FILE
# Writes every word of FILE to stdout, one per line, lower-cased.
word_list() {
  grep -o -E '[a-zA-Z]{3,}' "$1" | tr 'A-Z' 'a-z'
}

# tally
# Reads lines on stdin and writes "<count> <line>" for each distinct line,
# sorted numerically by count (ascending).
tally() {
  sort | uniq -c | sort -n
}

# top_words README STOPWORDS
# Writes the unfiltered table for README, then the table with every word
# listed in STOPWORDS removed. STOPWORDS holds one fixed string per line
# (grep -F -f); -w makes an entry match whole words only.
top_words() {
  local readme=$1
  local stopwords=$2

  word_list "$readme" | tally
  word_list "$readme" | grep -vwFf "$stopwords" | tally
}

top_words "$BASEDIR/README.md" "$BASEDIR/stopwords.txt"