diff options
Diffstat (limited to 'spelling')
-rwxr-xr-x | spelling/check-spelling.sh | 21 | ||||
-rw-r--r-- | spelling/en.txt | 33 | ||||
-rw-r--r-- | spelling/en_US.aff.txt | 10 | ||||
-rw-r--r-- | spelling/en_US.dic.txt | 11 | ||||
-rw-r--r-- | spelling/fr.txt | 8 | ||||
-rw-r--r-- | spelling/fr_FR.dic.txt | 1 | ||||
-rw-r--r-- | spelling/international.dic.txt | 50 | ||||
-rw-r--r-- | spelling/international.txt | 106 | ||||
-rw-r--r-- | spelling/pt.txt | 123 | ||||
-rw-r--r-- | spelling/pt_BR.dic.txt | 2 |
10 files changed, 280 insertions, 85 deletions
diff --git a/spelling/check-spelling.sh b/spelling/check-spelling.sh index 653a5f9..3ddfd2a 100755 --- a/spelling/check-spelling.sh +++ b/spelling/check-spelling.sh @@ -11,22 +11,21 @@ HTML_DIR="${1:-}" export LANG=C.UTF-8 for DICT in spelling/*.txt; do - diff <(sort "$DICT") "$DICT" || { + diff <(sort "$DICT" | uniq) "$DICT" || { echo "The $DICT dictionary is unsorted. To fix it, run:" >&2 - echo " LANG=C.UTF-8 sort $DICT | sponge $DICT" >&2 + echo " LANG=C.UTF-8 sort $DICT | uniq | sponge $DICT" >&2 exit 1 } done -finish() { - rm -f spelling.txt - rm -f dicts.txt -} -trap finish EXIT - -cat spelling/*.txt > dicts.txt - -find "${HTML_DIR}" -type f -name '*.html' | grep -v pastebin | hunspell -l -p dicts.txt -d fr_FR -d en_US -i utf-8 >> spelling.txt +rm -f spelling.txt +shopt -s globstar +for f in "${HTML_DIR}"/**/*.html; do + if ! grep -E '/pastebin(/|s.html)' <(echo "$f") > /dev/null; then + l="$(head -n2 "$f" | tail -n1 | cut -d\" -f2)" + hunspell -u3 -H -d "$l" -p <(cat spelling/international.txt "spelling/$l.txt") "$f" | tee -a spelling.txt + fi +done if [[ -s spelling.txt ]]; then printf "\nvvv Mispelled words detected by hunspell.\n\n" >&2 diff --git a/spelling/en.txt b/spelling/en.txt new file mode 100644 index 0000000..b4a2e52 --- /dev/null +++ b/spelling/en.txt @@ -0,0 +1,33 @@ +aren +autocommit +couldn +curation +declaratively +decrypting +didn +doesn +duplications +embeddable +filesystem +filesystems +isn +maintainence +oday +portuguese +portuguse +pre +programmatically +realising +reimplementation +repo +reproducibility +scriptable +shouldn +symlinks +syncable +só +tradeoffs +untrusted +ve +wasn +wouldn diff --git a/spelling/en_US.aff.txt b/spelling/en_US.aff.txt deleted file mode 100644 index 827c34f..0000000 --- a/spelling/en_US.aff.txt +++ /dev/null @@ -1,10 +0,0 @@ -aren -couldn -didn -doesn -isn -pre -sr -ve -wasn -wouldn diff --git a/spelling/en_US.dic.txt b/spelling/en_US.dic.txt deleted file mode 100644 index 90a7531..0000000 --- a/spelling/en_US.dic.txt +++ /dev/null @@ -1,11 +0,0 @@ -autocommit -curation -declaratively -decrypting -programmatically -realising -repo -reproducibility -scriptable -symlinks -tradeoffs diff --git a/spelling/fr.txt b/spelling/fr.txt new file mode 100644 index 0000000..aa09184 --- /dev/null +++ b/spelling/fr.txt @@ -0,0 +1,8 @@ +' +AJA +dimanche +earned +oday +ppris +só +ujourd'hui diff --git a/spelling/fr_FR.dic.txt b/spelling/fr_FR.dic.txt deleted file mode 100644 index b402cff..0000000 --- a/spelling/fr_FR.dic.txt +++ /dev/null @@ -1 +0,0 @@ -dimanche diff --git a/spelling/international.dic.txt b/spelling/international.dic.txt deleted file mode 100644 index f3637be..0000000 --- a/spelling/international.dic.txt +++ /dev/null @@ -1,50 +0,0 @@ -144p -250GB -32GB -500GB -81F90EC3CD356060 -8GB -André -BSON -CI -EuAndreh -Fastmail -GPLv3 -GitLab -Gmail -GuixSD -JS -Lerna -Matroska -Merkle -NPM -Nextcloud -NixOS -Pastebin -Raku -SSD -Sourcehut -Spacemacs -Staltz -VPN -Yandex -YouTube -brainer -buildGoModule -ci -dl -guix -html -i5 -i7 -intbytes -js -libre -merkle -myrepos -nixos -no-brainer -npm -touchpad -v8 -youtube diff --git a/spelling/international.txt b/spelling/international.txt new file mode 100644 index 0000000..a12f150 --- /dev/null +++ b/spelling/international.txt @@ -0,0 +1,106 @@ +144p +250GB +32GB +500GB +81F90EC3CD356060 +8GB +André +Atom +B1 +BN +BSON +BY +BY-SA +CI +Cantrill +CouchDB +Datomic +EuAndreh +F +FFI +Fastmail +GPLv +GPLv3 +GTK +GitLab +Gmail +GuixSD +Halloway +IndexedDB +JS +Joyent +L1 +LaTeX +Lerna +LilyPond +Matroska +Mentat +Merkle +NPM +Nextcloud +NixOS +POSIX +Pastebin +PouchDB +RSS +Raku +SA +SSD +Sourcehut +Spacemacs +StackOverflow +Staltz +TAB +TBs +VPN +WebAssembly +Yandex +YouTube +Zig +boneco +brainer +buildGoModule +cgit +ci +datalog +datom +datoms +dl +en +euandreh +fr +gcrypt +gt +guix +guixbuild +h1 +h6 +hinarioespirita +html +i5 +i7 +intbytes +jekyll +jemoji +js +kramdown +libre +lt +merkle +myrepos +nixos +no-brainer +npm +org +pastebin +pastebins +plaintext +pt +songbooks +sourcehut +sr +systemd +touchpad +v8 +xyz +youtube diff --git a/spelling/pt.txt b/spelling/pt.txt new file mode 100644 index 0000000..07202d4 --- /dev/null +++ b/spelling/pt.txt @@ -0,0 +1,123 @@ +Abaixo +Agosto +Anna +Aprendi +Blog +Cópia +H +HEA +I +L +Lista +Me +Postado +Postagens +Quando +T +Usar +Visite +Website +achar +arquivo +artigos +buscar +chegar +comece +comentário +como +completar +conhecimentos +contatar +criar +código +da +dados +de +desta +diretamente +direto +discussão +discussões +distribuir +do +dobráveis +dou eu +e +earned +email +empacotá +encontra +engasgo +entrada +envelope +escreva +escrever +escrevo +esforço +estou +eu +existentes +extra +fazer +ficou +formatos +gerar +impressão +inglês +interessantes +internet +intervalos +jeito +las +licenciado +licença +log +los +mandar +mande +me +mensagem +na +navegador +no +nome +normalmente +novo +o +oday +oje +ordená +os +padrão +para +parar +pessoal +por +post +postagens +prendi +procurando +procure +produção +projetos +pública +público +relacionados +reler +religioso +se +significa +simples +sobre +tempo +texto +timestamp +transpor +u +usando +usar +versão +versões +Ícone +é +úteis diff --git a/spelling/pt_BR.dic.txt b/spelling/pt_BR.dic.txt deleted file mode 100644 index 7ed8a57..0000000 --- a/spelling/pt_BR.dic.txt +++ /dev/null @@ -1,2 +0,0 @@ -os -sobre |