aboutsummaryrefslogtreecommitdiff
path: root/spelling
diff options
context:
space:
mode:
Diffstat (limited to 'spelling')
-rwxr-xr-xspelling/check-spelling.sh21
-rw-r--r--spelling/en.txt33
-rw-r--r--spelling/en_US.aff.txt10
-rw-r--r--spelling/en_US.dic.txt11
-rw-r--r--spelling/fr.txt8
-rw-r--r--spelling/fr_FR.dic.txt1
-rw-r--r--spelling/international.dic.txt50
-rw-r--r--spelling/international.txt106
-rw-r--r--spelling/pt.txt123
-rw-r--r--spelling/pt_BR.dic.txt2
10 files changed, 280 insertions, 85 deletions
diff --git a/spelling/check-spelling.sh b/spelling/check-spelling.sh
index 653a5f9..3ddfd2a 100755
--- a/spelling/check-spelling.sh
+++ b/spelling/check-spelling.sh
@@ -11,22 +11,21 @@ HTML_DIR="${1:-}"
export LANG=C.UTF-8
for DICT in spelling/*.txt; do
- diff <(sort "$DICT") "$DICT" || {
+ diff <(sort "$DICT" | uniq) "$DICT" || {
echo "The $DICT dictionary is unsorted. To fix it, run:" >&2
- echo " LANG=C.UTF-8 sort $DICT | sponge $DICT" >&2
+ echo " LANG=C.UTF-8 sort $DICT | uniq | sponge $DICT" >&2
exit 1
}
done
-finish() {
- rm -f spelling.txt
- rm -f dicts.txt
-}
-trap finish EXIT
-
-cat spelling/*.txt > dicts.txt
-
-find "${HTML_DIR}" -type f -name '*.html' | grep -v pastebin | hunspell -l -p dicts.txt -d fr_FR -d en_US -i utf-8 >> spelling.txt
+rm -f spelling.txt
+shopt -s globstar
+for f in "${HTML_DIR}"/**/*.html; do
+ if ! grep -E '/pastebin(/|s.html)' <(echo "$f") > /dev/null; then
+ l="$(head -n2 "$f" | tail -n1 | cut -d\" -f2)"
+ hunspell -u3 -H -d "$l" -p <(cat spelling/international.txt "spelling/$l.txt") "$f" | tee -a spelling.txt
+ fi
+done
if [[ -s spelling.txt ]]; then
printf "\nvvv Mispelled words detected by hunspell.\n\n" >&2
diff --git a/spelling/en.txt b/spelling/en.txt
new file mode 100644
index 0000000..b4a2e52
--- /dev/null
+++ b/spelling/en.txt
@@ -0,0 +1,33 @@
+aren
+autocommit
+couldn
+curation
+declaratively
+decrypting
+didn
+doesn
+duplications
+embeddable
+filesystem
+filesystems
+isn
+maintainence
+oday
+portuguese
+portuguse
+pre
+programmatically
+realising
+reimplementation
+repo
+reproducibility
+scriptable
+shouldn
+symlinks
+syncable
+só
+tradeoffs
+untrusted
+ve
+wasn
+wouldn
diff --git a/spelling/en_US.aff.txt b/spelling/en_US.aff.txt
deleted file mode 100644
index 827c34f..0000000
--- a/spelling/en_US.aff.txt
+++ /dev/null
@@ -1,10 +0,0 @@
-aren
-couldn
-didn
-doesn
-isn
-pre
-sr
-ve
-wasn
-wouldn
diff --git a/spelling/en_US.dic.txt b/spelling/en_US.dic.txt
deleted file mode 100644
index 90a7531..0000000
--- a/spelling/en_US.dic.txt
+++ /dev/null
@@ -1,11 +0,0 @@
-autocommit
-curation
-declaratively
-decrypting
-programmatically
-realising
-repo
-reproducibility
-scriptable
-symlinks
-tradeoffs
diff --git a/spelling/fr.txt b/spelling/fr.txt
new file mode 100644
index 0000000..aa09184
--- /dev/null
+++ b/spelling/fr.txt
@@ -0,0 +1,8 @@
+'
+AJA
+dimanche
+earned
+oday
+ppris
+só
+ujourd'hui
diff --git a/spelling/fr_FR.dic.txt b/spelling/fr_FR.dic.txt
deleted file mode 100644
index b402cff..0000000
--- a/spelling/fr_FR.dic.txt
+++ /dev/null
@@ -1 +0,0 @@
-dimanche
diff --git a/spelling/international.dic.txt b/spelling/international.dic.txt
deleted file mode 100644
index f3637be..0000000
--- a/spelling/international.dic.txt
+++ /dev/null
@@ -1,50 +0,0 @@
-144p
-250GB
-32GB
-500GB
-81F90EC3CD356060
-8GB
-André
-BSON
-CI
-EuAndreh
-Fastmail
-GPLv3
-GitLab
-Gmail
-GuixSD
-JS
-Lerna
-Matroska
-Merkle
-NPM
-Nextcloud
-NixOS
-Pastebin
-Raku
-SSD
-Sourcehut
-Spacemacs
-Staltz
-VPN
-Yandex
-YouTube
-brainer
-buildGoModule
-ci
-dl
-guix
-html
-i5
-i7
-intbytes
-js
-libre
-merkle
-myrepos
-nixos
-no-brainer
-npm
-touchpad
-v8
-youtube
diff --git a/spelling/international.txt b/spelling/international.txt
new file mode 100644
index 0000000..a12f150
--- /dev/null
+++ b/spelling/international.txt
@@ -0,0 +1,106 @@
+144p
+250GB
+32GB
+500GB
+81F90EC3CD356060
+8GB
+André
+Atom
+B1
+BN
+BSON
+BY
+BY-SA
+CI
+Cantrill
+CouchDB
+Datomic
+EuAndreh
+F
+FFI
+Fastmail
+GPLv
+GPLv3
+GTK
+GitLab
+Gmail
+GuixSD
+Halloway
+IndexedDB
+JS
+Joyent
+L1
+LaTeX
+Lerna
+LilyPond
+Matroska
+Mentat
+Merkle
+NPM
+Nextcloud
+NixOS
+POSIX
+Pastebin
+PouchDB
+RSS
+Raku
+SA
+SSD
+Sourcehut
+Spacemacs
+StackOverflow
+Staltz
+TAB
+TBs
+VPN
+WebAssembly
+Yandex
+YouTube
+Zig
+boneco
+brainer
+buildGoModule
+cgit
+ci
+datalog
+datom
+datoms
+dl
+en
+euandreh
+fr
+gcrypt
+gt
+guix
+guixbuild
+h1
+h6
+hinarioespirita
+html
+i5
+i7
+intbytes
+jekyll
+jemoji
+js
+kramdown
+libre
+lt
+merkle
+myrepos
+nixos
+no-brainer
+npm
+org
+pastebin
+pastebins
+plaintext
+pt
+songbooks
+sourcehut
+sr
+systemd
+touchpad
+v8
+xyz
+youtube
diff --git a/spelling/pt.txt b/spelling/pt.txt
new file mode 100644
index 0000000..07202d4
--- /dev/null
+++ b/spelling/pt.txt
@@ -0,0 +1,123 @@
+Abaixo
+Agosto
+Anna
+Aprendi
+Blog
+Cópia
+H
+HEA
+I
+L
+Lista
+Me
+Postado
+Postagens
+Quando
+T
+Usar
+Visite
+Website
+achar
+arquivo
+artigos
+buscar
+chegar
+comece
+comentário
+como
+completar
+conhecimentos
+contatar
+criar
+código
+da
+dados
+de
+desta
+diretamente
+direto
+discussão
+discussões
+distribuir
+do
+dobráveis
+dou eu
+e
+earned
+email
+empacotá
+encontra
+engasgo
+entrada
+envelope
+escreva
+escrever
+escrevo
+esforço
+estou
+eu
+existentes
+extra
+fazer
+ficou
+formatos
+gerar
+impressão
+inglês
+interessantes
+internet
+intervalos
+jeito
+las
+licenciado
+licença
+log
+los
+mandar
+mande
+me
+mensagem
+na
+navegador
+no
+nome
+normalmente
+novo
+o
+oday
+oje
+ordená
+os
+padrão
+para
+parar
+pessoal
+por
+post
+postagens
+prendi
+procurando
+procure
+produção
+projetos
+pública
+público
+relacionados
+reler
+religioso
+se
+significa
+simples
+sobre
+tempo
+texto
+timestamp
+transpor
+u
+usando
+usar
+versão
+versões
+Ícone
+úteis
diff --git a/spelling/pt_BR.dic.txt b/spelling/pt_BR.dic.txt
deleted file mode 100644
index 7ed8a57..0000000
--- a/spelling/pt_BR.dic.txt
+++ /dev/null
@@ -1,2 +0,0 @@
-os
-sobre