Skip to content

Commit

Permalink
Merge pull request #2662 from perl6/coke/clean-spell
Browse files Browse the repository at this point in the history
Remove unused words (and provide utility to find them)
  • Loading branch information
coke authored Mar 13, 2019
2 parents 352c3d7 + 01dca5d commit 5683411
Show file tree
Hide file tree
Showing 3 changed files with 67 additions and 212 deletions.
67 changes: 67 additions & 0 deletions util/clean-spell
Original file line number Diff line number Diff line change
@@ -0,0 +1,67 @@
#!/usr/bin/env perl6

# Remove words in xt/*.pws that are no longer needed
# * Bug fixes in the spell checker have removed the need
# to check certain words.
# * Edits to the docs themselves no longer use some words.

# Trust but verify: make sure you rerun the entire spell check
# after letting this program update the .pws files

use File::Temp;

use lib 'lib';
use Test-Files;
use Pod::Cache;

my @files = Test-Files.documents.grep({not $_ ~~ / 'README.' .. '.md' /});

@files = @files.map({
$_.ends-with('.pod6') ?? Pod::Cache.cache-file($_) !! $_;
});

my %killed;

sub erase-word($file, @words, $word="") {
my ($tmp_fname, $tmp_io) = tempfile;
for @words -> $i {
next if $i eq $word;
next if %killed{$i}:exists;
$tmp_io.say($i);
}
$tmp_io.close;
run('mv', $tmp_fname, $file);
}

for <xt/words.pws xt/code.pws> -> $dict {
my @words = $dict.IO.lines;
for @words -> $word {
note "Testing $dict / $word ";
my $keep = True;

my $proc = Proc::Async.new( 'grep', '-li', $word, |@files);
my $output = "";
$proc.stdout.tap(-> $buf { $output ~= $buf });
my $promise = await $proc.start;

if +$promise.status {
say "Can't find $dict/$word anywhere, kill it.";
$keep = False;
} else {
# Remove the one word we're testing from the file.
erase-word($dict, @words, $word);
my @raw-files = $output.lines.map({ $_.subst('.pod-cache/', '') });
my $proc = run( 'xt/aspell.t', |@raw-files );
if $proc.exitcode == 0 {
say "aspell test passed";
$keep = False;
} else {
say "aspell test failed, keep it";
}
}
%killed{$word} = True unless $keep;
}
erase-word($dict, @words);
}

dd %killed;
55 changes: 0 additions & 55 deletions xt/code.pws
Original file line number Diff line number Diff line change
@@ -1,30 +1,18 @@
aaaa
aaaaa
aaaaaa
aaab
aaabbc
aaabbcccc
aaaxbbxc
aabb
aabbccc
aabbccddaa
aachen
aachen's
aaf
aagcct
aao
aapl
aaron
aaron's
abab
ababab
abababa
abacabadabacaba
abba
abbas
abbas's
abbasid
abbasid's
abbbbbcdddddeffg
abcd
abcde
Expand Down Expand Up @@ -61,8 +49,6 @@ aj
algebradebugger
algebraparser
aliquot
amd
amd's
ame
amet
amic
Expand All @@ -80,7 +66,6 @@ atf
atfoobar
atomicint
atomicints
atomicsize
autolines
axxxbxxxc
ay
Expand Down Expand Up @@ -111,7 +96,6 @@ bindingtype
birthdaycongrats
bitrary
bj
blake's
bn
bol
bq
Expand All @@ -127,12 +111,10 @@ bú
cadabra
cagcggaagcct
calc
callees
cannonname
canonidn
canonname
canwrite
capturename
carefulclass
cba
ccc
Expand Down Expand Up @@ -171,7 +153,6 @@ dgram
diceroll
digifier
digitmatcher
dirs
dirstat
diskn
doesntexist
Expand All @@ -181,16 +162,13 @@ doorhandle
dostuff
dx
dxex
dxvo
dynint
eb
ee
ef
efg
ehehe
elit
encodedbuffer
eocsv
eoh
eoi
eos
Expand All @@ -206,7 +184,6 @@ failgoal
failhash
fairycake
fatratstr
fbtb
feff
fffd
ffff
Expand All @@ -219,17 +196,13 @@ findnodes
firstname
firstpos
flowinfo
fn
fnorbl
fo
foldl
foldr
foobaz
foober
foodhandle
foohandle
fooobar
foooobar
foox
fooy
fooz
Expand All @@ -241,7 +214,6 @@ fptr
freeaddrinfo
freija
frob
frobnicate
frobs
fromcharcode
fubar
Expand All @@ -256,7 +228,6 @@ getaddrinfo
gg
gha
ghi
globalish
goog
grammaradvice
grassmannnumber
Expand All @@ -271,13 +242,11 @@ hdr
headn
hh
hhgttu
hhh
hola
hou
howd
httprequest
https
hyperwhatever
ic
idaqt
idn
Expand All @@ -286,7 +255,6 @@ ij
imm
indir
iniformat
inlinepython
innie
installable
installermaker
Expand All @@ -296,7 +264,6 @@ intillos
inv
invcsw
invertiblepoint
iol
ip
ipsum
ipv
Expand Down Expand Up @@ -352,7 +319,6 @@ mrcv
msnapper
msnd
msvc
mtest
muchmoresecure
mult
myapp
Expand Down Expand Up @@ -385,8 +351,6 @@ nbsp
newfunc
nextone
niler
nith
nko
nodir
noez
nosuch
Expand Down Expand Up @@ -428,14 +392,12 @@ plustwo
postfixed
postgre
postorder
precompilationrepository
precompilationstore
predictiveiterator
prettylist
priv
prog
propspec
ptestpass
pwstruct
pêrl
q'this
Expand All @@ -448,7 +410,6 @@ rawheader
rbar
rdm
rectanglewithcachedarea
regexname
rememberit
renderbarchart
repeatchar
Expand Down Expand Up @@ -483,40 +444,29 @@ someparentclass
somerole
sometext
sortedarray
sourcecode
speedoflight
spoint
sprintfformat
sref
ssz
startee
stmt
strcpy
strdistance
strillo
strorarrayofstr
strs
structobj
su
supplys
tac
tbar
tbaz
tcd
temphandle
tes
testactions
testanimal
testee
testfile
testgrammar
testpass
textnode
that'sawesome
thatmodule
theclass
thename
thereifixedit
thid
threadpool
tjd
Expand All @@ -542,15 +492,13 @@ typedef
typehouse
typer
tys
uares
ubits
uia
unitcheck
unitish
unspec
userblock
userprofile
utestuser
valueobjat
versionmajor
versionminor
Expand All @@ -567,8 +515,6 @@ withoutlinenumber
withtype
wix
wne
wraphandler
wrappee
xa
xab
xaf
Expand All @@ -588,7 +534,6 @@ yeterani
yourapp
yourclass
yourmodule
yournick
yy
yz
za
Expand Down
Loading

0 comments on commit 5683411

Please sign in to comment.