#!/bin/sh
# Break file(s) into words, v1.1 (c) László Németh, BSD License
# v1.1: fixes for tab handling, ISO-8859-2 characters, and similar problems
# break_words FILE...
#
# Concatenates the given files, keeps only ASCII letters, the ISO-8859-2
# byte ranges listed below and the word separators, then puts every word on
# its own line and prints the sorted list with duplicates removed.
#
# Arguments: one or more file names (passed to cat verbatim, so names with
#            whitespace are safe).
# Outputs:   sorted unique words on stdout; with no arguments, a one-line
#            usage hint on stdout.
# Returns:   0 when called without arguments, otherwise the status of the
#            pipeline (i.e. of its last command).
break_words() {
  case $# in
    0) echo "break file(s)"; return 0;;
  esac

  # Notes on the two tr invocations:
  #  * tr sets are plain character lists, not regex bracket expressions, so
  #    no surrounding "[^...]" is used (it would add '[', '^' and ']' to the
  #    set of kept characters).
  #  * The literal hyphen is placed last in each set; anywhere else it would
  #    form a range (e.g. "/-:" means '/', the digits and ':').
  #  * '[\n*]' repeats the newline to the length of the first set, which is
  #    the POSIX-specified way to map many characters onto one.
  #  * LC_ALL=C makes tr treat its input as single bytes, which is what the
  #    octal ISO-8859-2 ranges expect.
  cat -- "$@" |
    LC_ALL=C tr -cd 'a-zA-Z\241-\254\256-\326\330-\366\370-\377/ \t\n:(),-' |
    LC_ALL=C tr ' /:(),\t-' '[\n*]' |
    sort |
    uniq
}

break_words "$@"
