Skip to content

Commit

Permalink
update build script and rebuild wordlists
Browse files Browse the repository at this point in the history
  • Loading branch information
ynsrc committed May 25, 2024
1 parent 113d02b commit 5d86f99
Show file tree
Hide file tree
Showing 16 changed files with 86 additions and 2,250 deletions.
51 changes: 50 additions & 1 deletion build.sh
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,56 @@ done
# filter_wordlist NAME
#
# Reads raw word-list entries from stdin (one per line) and writes the
# cleaned, sorted and de-duplicated list to stdout.
#
# Arguments: $1 - file name of the list (e.g. "verb.txt"); it selects which
#                 clean-up rules apply. Unknown names are only sorted.
# Note: the bracket expressions below contain multi-byte characters, so grep
#       presumably needs a UTF-8 locale to treat them as single characters
#       (TODO confirm the locale the build runs under).
filter_wordlist() {
  case "$1" in
    adjective.txt | adverb.txt | article.txt)
      # Drop entries containing an ellipsis, a typographic apostrophe, a dot
      # or an opening parenthesis.
      grep -vE '[…’\.\(]' | sort -u
      ;;

    affix-prefix.txt)
      # Keep only entries that end with a hyphen.
      grep -E '^.*-$' | sort -u
      ;;

    affix-suffix.txt)
      # Keep entries that start with a hyphen, turn dots and ellipses into
      # hyphens and squeeze runs of hyphens into one.
      # sed replaces the literal sequences; a byte-oriented `tr '.…' '-'`
      # would also rewrite the individual bytes of "…" wherever they occur
      # inside other UTF-8 characters (e.g. "æ") and corrupt those entries.
      grep -E '^-' \
        | sed -e 's/…/-/g' -e 's/\./-/g' \
        | tr -s '-' \
        | grep '^-' \
        | sort -u
      ;;

    comparative.txt)
      # Drop entries that start with a hyphen.
      grep -vE '^-' | sort -u
      ;;

    expression-multi-word.txt)
      # Drop entries containing "à".
      grep -v 'à' | sort -u
      ;;

    interjection.txt)
      # Drop entries containing "à", a typographic apostrophe or a comma,
      # then strip exclamation marks from the remaining entries.
      grep -vE '[à’,]' | tr -d '!' | sort -u
      ;;

    noun-das.txt | noun-der.txt | noun-die.txt)
      # Drop entries starting with a dot or containing any of the listed
      # punctuation characters.
      # NOTE(review): the character after "\+\" appears to be U+01C3, not an
      # ASCII "!" - confirm this is intended.
      grep -vE '^\.|[…\*\+\ǃ’„“§]' | sort -u
      ;;

    noun-plural.txt)
      # Drop entries containing an ellipsis or an opening parenthesis.
      grep -vE '…|\(' | sort -u
      ;;

    number-cardinal.txt | number-ordinal.txt)
      # Drop entries starting with a dot or containing an ellipsis.
      grep -vE '^\.|…' | sort -u
      ;;

    particle.txt)
      # Drop entries starting with a dot, ending with a dot or hyphen, or
      # containing an ellipsis or "à".
      grep -vE '^\.|[\.-]$|[…à]' | sort -u
      ;;

    verb.txt)
      # Drop entries starting with a dot or containing an ellipsis, then
      # strip parentheses from the remaining entries.
      grep -vE '^\.|…' | tr -d '()' | sort -u
      ;;

    *)
      sort -u
      ;;
  esac
}

# Filter every raw list in build/ into ${TARGET}, keeping the file name.
for wlfile in build/*.txt; do
  # An unmatched glob stays literal; skip it rather than create "*.txt".
  [ -e "$wlfile" ] || continue
  filename=${wlfile##*/}
  # ${TARGET:?} aborts instead of writing into "/" when TARGET is unset.
  filter_wordlist "$filename" < "$wlfile" \
    > "${TARGET:?TARGET is not set}/$filename"
done

# Pack the v1 word lists together with README.md and LICENSE into a
# gzip-compressed archive, listing each file as it is added.
tar -c -v -z -f build/wordlists.tar.gz v1/*.txt README.md LICENSE
Loading

0 comments on commit 5d86f99

Please sign in to comment.