digitalist · March 21, 2021 08:07
diff --git a/gistfile1.txt b/gistfile1.txt
 # Build a word-frequency list from every *.html file below the current directory.
 # Stages: HTML -> plain text -> one token per line -> lowercase -> count -> sort by count (descending).
 # todo: clean utf chars with tr
 mkdir -p ~/temp  # the output redirect fails when the directory does not exist
 # The explicit "." starting point keeps this working on find implementations that require one.
 # sed drops the empty token produced when the text starts with punctuation or whitespace.
 find . -name '*.html' -exec html2text {} \; \
   | tr -s '[[:punct:][:space:]]' '\n' \
   | tr '[:upper:]' '[:lower:]' \
   | sed '/^$/d' \
   | sort | uniq -c | sort -bnr > ~/temp/words.txt
	# Build a word-frequency list from every *.html file below the current directory.
	# Stages: HTML -> plain text -> one token per line -> lowercase -> count -> sort by count (descending).
	# todo: clean utf chars with tr
	mkdir -p ~/temp  # the output redirect fails when the directory does not exist
	# Pipes must be unescaped: a backslash-escaped pipe is handed to find as a literal argument.
	# The explicit "." starting point keeps this working on find implementations that require one.
	# sed drops the empty token produced when the text starts with punctuation or whitespace.
	find . -name '*.html' -exec html2text {} \; \
	  | tr -s '[[:punct:][:space:]]' '\n' \
	  | tr '[:upper:]' '[:lower:]' \
	  | sed '/^$/d' \
	  | sort | uniq -c | sort -bnr > ~/temp/words.txt