File Coverage

File:	lib/CheckSpelling/SpellingCollator.pm
Coverage:	83.4%

line	stmt	bran	cond	sub	time	code
1						#! -*-perl-*-
2
3						package CheckSpelling::SpellingCollator;
4
5						our $VERSION='0.1.0';
6	1 1 1			1	105798 2 23	use warnings;
7	1 1 1			1	2 1 23	use File::Path qw(remove_tree);
8	1 1 1			1	182 1 2155	use CheckSpelling::Util;
9
10						my %letter_map;
11						my %ignored_event_map;
12						my $disable_word_collating;
13
14						sub get_field {
15	28			28	22	my ($record, $field) = @_;
16	28	100			315	return 0 unless $record =~ (/\b$field:\s*(\d+)/);
17	16				21	return $1;
18						}
19
20						sub get_array {
21	2			2	2	my ($record, $field) = @_;
22	2	50			14	return () unless $record =~ (/\b$field: \[([^\]]+)\]/);
23	2				2	my $values = $1;
24	2				3	return split /\s*,\s*/, $values;
25						}
26
27						sub maybe {
28	7			7	7	my ($next, $value) = @_;
29	7	50	67		9	$next = $value unless $next && $next < $value;
30	7				5	return $next;
31						}
32
33						my %expected = ();
34						sub expect_item {
35	98			98	52	my ($item, $value) = @_;
36	98				42	our %expected;
37	98				30	my $next;
38	98	100 100			101	if (defined $expected{$item}) {
39	26				11	$next = $expected{$item};
40	26	100			21	$next = $value if $value < $next;
41						} elsif ($item =~ /^([A-Z])(.*)/) {
42	12				8	$item = $1 . lc $2;
43	12	100			9	if (defined $expected{$item}) {
44	2				2	$next = $expected{$item};
45	2				1	$next = maybe($next, $value + .1);
46						} else {
47	10				7	$item = lc $item;
48	10	100			10	if (defined $expected{$item}) {
49	5				5	$next = $expected{$item};
50	5				1	$next = maybe($next, $value + .2);
51						}
52						}
53						}
54	98	100			101	return 0 unless defined $next;
55	33				19	$expected{$item} = $next;
56	33				64	return $value;
57						}
58
59						sub skip_item {
60	52			52	22	my ($word) = @_;
61	52	100			37	return 1 if expect_item($word, 1);
62	32				21	my $key = lc $word;
63	32	50			14	return 2 if expect_item($key, 2);
64	32	100 100 100			43	if ($key =~ /.s$/) {
65	2	100			3	if ($key =~ /ies$/) {
66	1				12	$key =~ s/ies$/y/;
67						} else {
68	1				1	$key =~ s/s$//;
69						}
70						} elsif ($key =~ /^(.+[^aeiou])ed$/) {
71	1				1	$key = $1;
72						} elsif ($key =~ /^(.+)'[ds]$/) {
73	6				2	$key = $1;
74						} else {
75	23				19	return 0;
76						}
77	9	50			9	return 3 if expect_item($key, 3);
78	0				0	return 0;
79						}
80
81						sub should_skip_warning {
82	69			69	45	my ($warning) = @_;
83	69	100			86	if ($warning =~ /\(([-\w]+)\)$/) {
84	68				39	my ($code) = ($1);
85	68				24	our %ignored_event_map;
86	68	100			51	return 1 if $ignored_event_map{$code};
87						}
88	68				47	return 0;
89						}
90
91						sub log_skip_item {
92	48			48	55	my ($item, $file, $warning, $unknown_word_limit) = @_;
93	48	50			33	return 1 if should_skip_warning $warning;
94	48	100			33	return 1 if skip_item($item);
95	19				13	my $seen_count = $seen{$item};
96	19	100			11	if (defined $seen_count) {
97	6	100	100		10	if (!defined $unknown_word_limit || ($seen_count++ < $unknown_word_limit)) {
98	5				22	print MORE_WARNINGS "$file$warning\n"
99						} else {
100	1				2	$last_seen{$item} = "$file$warning";
101						}
102	6				5	$seen{$item} = $seen_count;
103	6				9	return 1;
104						}
105	13				11	$seen{$item} = 1;
106	13				14	return 0;
107						}
108
109						sub stem_word {
110	22			22	9	my ($key) = @_;
111	22				11	our $disable_word_collating;
112	22	50			9	return $key if $disable_word_collating;
113
114	22	100 100			25	if ($key =~ /.s$/) {
115	3	100			5	if ($key =~ /ies$/) {
116	1				3	$key =~ s/ies$/y/;
117						} else {
118	2				2	$key =~ s/s$//;
119						}
120						} elsif ($key =~ /.[^aeiou]ed$/) {
121	1				2	$key =~ s/ed$//;
122						}
123	22				15	return $key;
124						}
125
126						sub collate_key {
127	77			77	48	my ($key) = @_;
128	77				30	our $disable_word_collating;
129	77	100			42	if ($disable_word_collating) {
130	16				16	$char = lc substr $key, 0, 1;
131						} else {
132	61				41	$key = lc $key;
133	61				41	$key =~ s/''+/'/g;
134	61				34	$key =~ s/'[sd]$//;
135	61				35	$key =~ s/^[^Ii]?'+(.*)/$1/;
136	61				25	$key =~ s/(.*?)'$/$1/;
137	61				54	$char = substr $key, 0, 1;
138						}
139	77				92	return ($key, $char);
140						}
141
142						sub load_expect {
143	9			9	473	my ($expect) = @_;
144	9				5	our %expected;
145	9				9	%expected = ();
146	9	50			76	if (open(EXPECT, '<:utf8', $expect)) {
147	9				58	while ($word = <EXPECT>) {
148	34				49	$word =~ s/\R//;
149	34				68	$expected{$word} = 0;
150						}
151	9				32	close EXPECT;
152						}
153						}
154
155						sub harmonize_expect {
156	8			8	5	our $disable_word_collating;
157	8				4	our %letter_map;
158	8				2	our %expected;
159
160	8				12	for my $word (keys %expected) {
161	31				19	my ($key, $char) = collate_key $word;
162	31				15	my %word_map = ();
163	31	100			37	next unless defined $letter_map{$char}{$key};
164	15 15				2 23	%word_map = %{$letter_map{$char}{$key}};
165	15	100			18	next if defined $word_map{$word};
166	3				1	my $words = scalar keys %word_map;
167	3	50			2	next if $words > 2;
168	3	100			3	if ($word eq $key) {
169	1	50			1	next if ($words > 1);
170						}
171	2				3	delete $expected{$word};
172						}
173						}
174
175						sub group_related_words {
176	9			9	26	our %letter_map;
177	9				4	our $disable_word_collating;
178	9	100			7	return if $disable_word_collating;
179
180						# group related words
181	7				16	for my $char (sort CheckSpelling::Util::number_biased keys %letter_map) {
182	19 19				12 15	for my $plural_key (sort keys(%{$letter_map{$char}})) {
183	22				14	my $key = stem_word $plural_key;
184	22	100			18	next if $key eq $plural_key;
185	4	100			3	next unless defined $letter_map{$char}{$key};
186	3 3				3 3	my %word_map = %{$letter_map{$char}{$key}};
187	3 3				1 4	for $word (keys(%{$letter_map{$char}{$plural_key}})) {
188	3				3	$word_map{$word} = 1;
189						}
190	3				3	$letter_map{$char}{$key} = \%word_map;
191	3				4	delete $letter_map{$char}{$plural_key};
192						}
193						}
194						}
195
196						sub count_warning {
197	10			10	29	my ($warning) = @_;
198	10				4	our %counters;
199	10				6	our %ignored_event_map;
200	10	100			17	if ($warning =~ /\(([-\w]+)\)$/) {
201	8				5	my ($code) = ($1);
202	8	50			8	next if defined $ignored_event_map{$code};
203	8				9	++$counters{$code};
204						}
205						}
206
207						sub report_timing {
208	0			0	0	my ($name, $start_time, $directory, $marker) = @_;
209	0				0	my $end_time = (stat "$directory/$marker")[9];
210	0				0	$name =~ s/"/\\"/g;
211	0				0	print TIMING_REPORT "\"$name\", $start_time, $end_time\n";
212						}
213
214						sub get_pattern_with_context {
215	18			18	9	my ($path) = @_;
216	18	100			19	return unless defined $ENV{$path};
217	9				9	$ENV{$path} =~ /(.*)/;
218	9	50			55	return unless open ITEMS, '<:utf8', $1;
219
220	9				5	my @items;
221	9				4	my $context = '';
222	9				41	while (<ITEMS>) {
223	2				2	my $pattern = $_;
224	2	100			3	if ($pattern =~ /^#/) {
225	1	50			2	if ($pattern =~ /^# /) {
226	1				2	$context .= $pattern;
227						} else {
228	0				0	$context = '';
229						}
230	1				2	next;
231						}
232	1				1	chomp $pattern;
233	1	50			4	unless ($pattern =~ /./) {
234	0				0	$context = '';
235	0				0	next;
236						}
237	1				2	push @items, $context.$pattern;
238	1				2	$context = '';
239						}
240	9				24	close ITEMS;
241	9				10	return @items;
242						}
243
244						sub summarize_totals {
245	18			18	13	my ($formatter, $path, $items, $totals, $file_counts) = @_;
246	18 18	100			7 19	return unless @{$totals};
247	1	50			20	return unless open my $fh, '>:utf8', $path;
248	1 1				0 1	my $totals_count = scalar(@{$totals}) - 1;
249	1				1	my @indices;
250	1	50			1	if ($file_counts) {
251						@indices = sort {
252	0 0	0			0 0	$totals->[$b] <=> $totals->[$a] ||
253						$file_counts->[$b] <=> $file_counts->[$a]
254						} 0 .. $totals_count;
255						} else {
256						@indices = sort {
257	1 0				1 0	$totals->[$b] <=> $totals->[$a]
258						} 0 .. $totals_count;
259						}
260	1				1	for my $i (@indices) {
261	1	50			1	last unless $totals->[$i] > 0;
262	1				1	my $rule_with_context = $items->[$i];
263	1				1	my ($description, $rule);
264	1	50			2	if ($rule_with_context =~ /^(.*\n)([^\n]+)$/s) {
265	1				2	($description, $rule) = ($1, $2);
266						} else {
267	0				0	($description, $rule) = ('', $rule_with_context);
268						}
269	1	50			1	print $fh $formatter->(
270						$totals->[$i],
271						($file_counts ? " file-count: $file_counts->[$i]" : ""),
272						$description,
273						$rule
274						);
275						}
276	1				39	close $fh;
277						}
278
279						sub main {
280	9			9	15895	my @directories;
281						my @cleanup_directories;
282	9				0	my @check_file_paths;
283
284	9				9	my $early_warnings = CheckSpelling::Util::get_file_from_env('early_warnings', '/dev/null');
285	9				7	my $warning_output = CheckSpelling::Util::get_file_from_env('warning_output', '/dev/stderr');
286	9				5	my $more_warnings = CheckSpelling::Util::get_file_from_env('more_warnings', '/dev/stderr');
287	9				5	my $counter_summary = CheckSpelling::Util::get_file_from_env('counter_summary', '/dev/stderr');
288	9				7	my $ignored_events = CheckSpelling::Util::get_file_from_env('ignored_events', '');
289	9	100			8	if ($ignored_events) {
290	2				0	our %ignored_event_map;
291	2				4	for my $event (split /,/, $ignored_events) {
292	2				2	$ignored_event_map{$event} = 1;
293						}
294						}
295	9				9	my $should_exclude_file = CheckSpelling::Util::get_file_from_env('should_exclude_file', '/dev/null');
296	9				6	my $unknown_word_limit = CheckSpelling::Util::get_val_from_env('unknown_word_limit', undef);
297	9				6	my $unknown_file_word_limit = CheckSpelling::Util::get_val_from_env('unknown_file_word_limit', undef);
298	9				5	my $candidate_example_limit = CheckSpelling::Util::get_file_from_env('INPUT_CANDIDATE_EXAMPLE_LIMIT', '3');
299	9				4	my $disable_flags = CheckSpelling::Util::get_file_from_env('INPUT_DISABLE_CHECKS', '');
300	9				5	my $only_check_changed_files = CheckSpelling::Util::get_file_from_env('INPUT_ONLY_CHECK_CHANGED_FILES', '');
301	9				6	my $disable_noisy_file = $disable_flags =~ /(?:^|,|\s)noisy-file(?:,|\s|$)/;
302	9		67		24	our $disable_word_collating = $only_check_changed_files || $disable_flags =~ /(?:^|,|\s)word-collating(?:,|\s|$)/;
303	9				7	my $file_list = CheckSpelling::Util::get_file_from_env('check_file_names', '');
304	9				6	my $timing_report = CheckSpelling::Util::get_file_from_env('timing_report', '');
305	9				7	my ($start_time, $end_time);
306
307	9				171	open WARNING_OUTPUT, '>:utf8', $warning_output;
308	9				129	open MORE_WARNINGS, '>:utf8', $more_warnings;
309	9				108	open COUNTER_SUMMARY, '>:utf8', $counter_summary;
310	9				67	open SHOULD_EXCLUDE, '>:utf8', $should_exclude_file;
311	9	50			6	if ($timing_report) {
312	0				0	open TIMING_REPORT, '>:utf8', $timing_report;
313	0				0	print TIMING_REPORT "file, start, finish\n";
314						}
315
316	9				7	my @candidates = get_pattern_with_context('candidates_path');
317	9				8	my @candidate_totals = (0) x scalar @candidates;
318	9				3	my @candidate_file_counts = (0) x scalar @candidates;
319
320	9				7	my @forbidden = get_pattern_with_context('forbidden_path');
321	9				9	my @forbidden_totals = (0) x scalar @forbidden;
322
323	9				5	my @delayed_warnings;
324	9				20	our %letter_map = ();
325
326	9				3	my %file_map = ();
327
328	9				21	for my $directory (<>) {
329	12				12	chomp $directory;
330	12	50			20	next unless $directory =~ /^(.*)$/;
331	12				8	$directory = $1;
332	12	100			36	unless (-e $directory) {
333	1				2	print STDERR "Could not find: $directory\n";
334	1				1	next;
335						}
336	11	100			27	unless (-d $directory) {
337	1				11	print STDERR "Not a directory: $directory\n";
338	1				1	next;
339						}
340
341						# if there's no filename, we can't report
342	10	100			68	next unless open(NAME, '<:utf8', "$directory/name");
343	9				49	my $file=<NAME>;
344	9				34	close NAME;
345
346	9				19	$file_map{$file} = $directory;
347						}
348
349	9				14	for my $file (sort keys %file_map) {
350	9				8	my $directory = $file_map{$file};
351	9	50			7	if ($timing_report) {
352	0				0	$start_time = (stat "$directory/name")[9];
353						}
354
355	9	100			44	if (-e "$directory/skipped") {
356	1				7	open SKIPPED, '<:utf8', "$directory/skipped";
357	1				8	my $reason=<SKIPPED>;
358	1				2	close SKIPPED;
359	1				1	chomp $reason;
360	1				5	push @delayed_warnings, "$file:1:1 ... 1, Warning - Skipping `$file` because $reason\n";
361	1				8	print SHOULD_EXCLUDE "$file\n";
362	1				1	push @cleanup_directories, $directory;
363	1	50			1	report_timing($file, $start_time, $directory, 'skipped') if ($timing_report);
364	1				1	next;
365						}
366
367						# stats isn't written if there was nothing interesting in the file
368	8	100			26	unless (-s "$directory/stats") {
369	1				1	push @directories, $directory;
370	1	50			0	report_timing($file, $start_time, $directory, 'warnings') if ($timing_report);
371	1				1	next;
372						}
373
374	7	100			7	if ($file eq $file_list) {
375	1				6	open FILE_LIST, '<:utf8', $file_list;
376	1				1	push @check_file_paths, '0 placeholder';
377	1				5	for my $check_file_path (<FILE_LIST>) {
378	4				3	chomp $check_file_path;
379	4				4	push @check_file_paths, $check_file_path;
380						}
381	1				5	close FILE_LIST;
382						}
383
384	7				4	my ($words, $unrecognized, $unknown, $unique);
385
386						{
387	7 7				3 58	open STATS, '<:utf8', "$directory/stats";
388	7				34	my $stats=<STATS>;
389	7				12	close STATS;
390	7				5	$words=get_field($stats, 'words');
391	7				5	$unrecognized=get_field($stats, 'unrecognized');
392	7				5	$unknown=get_field($stats, 'unknown');
393	7				7	$unique=get_field($stats, 'unique');
394	7				5	my @candidate_list;
395	7	50			4	if (@candidate_totals) {
396	0				0	@candidate_list=get_array($stats, 'candidates');
397	0				0	my @lines=get_array($stats, 'candidate_lines');
398	0	0			0	if (@candidate_list) {
399	0				0	for (my $i=0; $i < scalar @candidate_list; $i++) {
400	0				0	my $hits = $candidate_list[$i];
401	0	0			0	if ($hits) {
402	0				0	$candidate_totals[$i] += $hits;
403	0	0			0	if ($candidate_file_counts[$i]++ < $candidate_example_limit) {
404	0				0	my $pattern = (split /\n/,$candidates[$i])[-1];
405	0				0	my $position = $lines[$i];
406	0				0	$position =~ s/:(\d+)$/ ... $1/;
407	0				0	my $wrapped = CheckSpelling::Util::wrap_in_backticks($pattern);
408	0				0	push @delayed_warnings, "$file:$position, Notice - Line matches candidate pattern $wrapped (candidate-pattern)\n";
409						}
410						}
411						}
412						}
413						}
414	7	100			8	if (@forbidden_totals) {
415	1				1	@forbidden_list=get_array($stats, 'forbidden');
416	1				1	my @lines=get_array($stats, 'forbidden_lines');
417	1	50			1	if (@forbidden_list) {
418	1				1	for (my $i=0; $i < scalar @forbidden_list; $i++) {
419	1				1	my $hits = $forbidden_list[$i];
420	1	50			1	if ($hits) {
421	1				2	$forbidden_totals[$i] += $hits;
422						}
423						}
424						}
425						}
426						#print STDERR "$file (unrecognized: $unrecognized; unique: $unique; unknown: $unknown, words: $words, candidates: [".join(", ", @candidate_list)."])\n";
427						}
428
429	7	50			5	report_timing($file, $start_time, $directory, 'unknown') if ($timing_report);
430						# These heuristics are very new and need tuning/feedback
431	7	50			9	if (
432						($unknown > $unique)
433						# || ($unrecognized > $words / 2)
434						) {
435	0	0			0	unless ($disable_noisy_file) {
436	0	0			0	if ($file ne $file_list) {
437	0				0	push @delayed_warnings, "$file:1:1 ... 1, Warning - Skipping `$file` because it seems to have more noise ($unknown) than unique words ($unique) (total: $unrecognized / $words). (noisy-file)\n";
438	0				0	print SHOULD_EXCLUDE "$file\n";
439						} else {
440	0				0	push @delayed_warnings, "$file:1:1 ... 1, Warning - Skipping file list because there seems to be more noise ($unknown) than unique words ($unique) (total: $unrecognized / $words). (noisy-file-list)\n";
441						}
442	0				0	push @directories, $directory;
443	0				0	next;
444						}
445						}
446	7	100			29	unless (-s "$directory/unknown") {
447	1				1	push @directories, $directory;
448	1				1	next;
449						}
450	6				38	open UNKNOWN, '<:utf8', "$directory/unknown";
451	6				42	for $token (<UNKNOWN>) {
452	49				47	$token =~ s/\R//;
453	49	100			46	next unless $token =~ /./;
454	46				26	my ($key, $char) = collate_key $token;
455	46	100			54	$letter_map{$char} = () unless defined $letter_map{$char};
456	46				20	my %word_map = ();
457	46 14	100			39 17	%word_map = %{$letter_map{$char}{$key}} if defined $letter_map{$char}{$key};
458	46				47	$word_map{$token} = 1;
459	46				62	$letter_map{$char}{$key} = \%word_map;
460						}
461	6				20	close UNKNOWN;
462	6				9	push @directories, $directory;
463						}
464	9				22	close SHOULD_EXCLUDE;
465	9	50			9	close TIMING_REPORT if $timing_report;
466
467						summarize_totals(
468						sub {
469	0			0	0	my ($hits, $files, $context, $pattern) = @_;
470	0				0	return "# hit-count: $hits$files\n$context$pattern\n\n",
471						},
472	9				27	CheckSpelling::Util::get_file_from_env('candidate_summary', '/dev/stderr'),
473						\@candidates,
474						\@candidate_totals,
475						\@candidate_file_counts,
476						);
477
478						summarize_totals(
479						sub {
480	1			1	1	my (undef, undef, $context, $pattern) = @_;
481	1				2	$context =~ s/^# //gm;
482	1				1	chomp $context;
483	1				1	my $details;
484	1	50			3	if ($context =~ /^(.*?)$(.*)/ms) {
485	1				1	($context, $details) = ($1, $2);
486	1	50			1	$details = "\n$details" if $details;
487						}
488	1	50			1	$context = 'Pattern' unless $context;
489	1				9	return "#### $context$details\n```\n$pattern\n```\n\n";
490						},
491	9				27	CheckSpelling::Util::get_file_from_env('forbidden_summary', '/dev/stderr'),
492						\@forbidden,
493						\@forbidden_totals,
494						);
495
496	9				27	group_related_words;
497
498	9	100			11	if (defined $ENV{'expect'}) {
499	8				8	$ENV{'expect'} =~ /(.*)/;
500	8				6	load_expect $1;
501	8				8	harmonize_expect;
502						}
503
504	9				8	my %seen = ();
505	9				4	our %counters;
506	9				5	%counters = ();
507
508	9	100			31	if (-s $early_warnings) {
509	1				6	open WARNINGS, '<:utf8', $early_warnings;
510	1				9	for my $warning (<WARNINGS>) {
511	1				2	chomp $warning;
512	1				1	count_warning $warning;
513	1	50			1	next if should_skip_warning $warning;
514	1				4	print WARNING_OUTPUT "$warning\n";
515						}
516	1				3	close WARNINGS;
517						}
518
519	9				4	my %last_seen;
520						my %unknown_file_word_count;
521	9				5	for my $directory (@directories) {
522	8	100			27	next unless (-s "$directory/warnings");
523	7	50			44	next unless open(NAME, '<:utf8', "$directory/name");
524	7				30	my $file=<NAME>;
525	7				14	close NAME;
526	7				16	my $is_file_list = $file eq $file_list;
527	7				37	open WARNINGS, '<:utf8', "$directory/warnings";
528	7	100			5	if (!$is_file_list) {
529	6				37	for $warning (<WARNINGS>) {
530	49				32	chomp $warning;
531	49	100			88	if ($warning =~ m/:(\d+):(\d+ \.\.\. \d+): `(.*)`/) {
532	48				47	my ($line, $range, $item) = ($1, $2, $3);
533	48				27	my $wrapped = CheckSpelling::Util::wrap_in_backticks($item);
534	48				99	$warning =~ s/:\d+:\d+ \.\.\. \d+: `.*`/:$line:$range, Warning - $wrapped is not a recognized word\. \(unrecognized-spelling\)/;
535	48	100			30	next if log_skip_item($item, $file, $warning, $unknown_word_limit);
536						} else {
537	1	50			1	if ($warning =~ /\`(.*?)\` in line\. \(token-is-substring\)/) {
538	0	0			0	next if skip_item($1);
539						}
540	1				1	count_warning $warning;
541						}
542	14	50			9	next if should_skip_warning $warning;
543	14				42	print WARNING_OUTPUT "$file$warning\n";
544						}
545						} else {
546	1				8	for $warning (<WARNINGS>) {
547	6				6	chomp $warning;
548	6	50			11	next unless $warning =~ s/^:(\d+)/:1/;
549	6				6	$file = $check_file_paths[$1];
550	6	100			20	if ($warning =~ s/:(\d+ \.\.\. \d+): `(.*)`/:$1, Warning - `$2` is not a recognized word\. \(check-file-path\)/) {
551	4	50			1	next if skip_item($2);
552	4	50			7	if (defined $unknown_file_word_limit) {
553	4	100			6	next if ++$unknown_file_word_count{$2} > $unknown_file_word_limit;
554						}
555						}
556	5	100			5	next if should_skip_warning $warning;
557	4				11	print WARNING_OUTPUT "$file$warning\n";
558	4				5	count_warning $warning;
559						}
560						}
561	7				27	close WARNINGS;
562						}
563	9				162	close MORE_WARNINGS;
564
565	9				7	for my $warning (@delayed_warnings) {
566	1	50			1	next if should_skip_warning $warning;
567	1				1	count_warning $warning;
568	1				1	print WARNING_OUTPUT $warning;
569						}
570	9	100			7	if (defined $unknown_word_limit) {
571	1				2	for my $warned_word (sort keys %last_seen) {
572	0				0	my $warning_count = $seen{$warned_word};
573	0	0			0	next unless $warning_count >= $unknown_word_limit;
574	0				0	my $warning = $last_seen{$warned_word};
575	0				0	$warning =~ s/\Q. (unrecognized-spelling)\E/ -- found $warning_count times. (limited-references)\n/;
576	0	0			0	next if should_skip_warning $warning;
577	0				0	print WARNING_OUTPUT $warning;
578	0				0	count_warning $warning;
579						}
580						}
581	9				207	close WARNING_OUTPUT;
582
583	9	100			17	if (%counters) {
584	2				2	my $continue='';
585	2				3	print COUNTER_SUMMARY "{\n";
586	2				4	for my $code (sort keys %counters) {
587	4				6	print COUNTER_SUMMARY qq<$continue"$code": $counters{$code}\n>;
588	4				4	$continue=',';
589						}
590	2				2	print COUNTER_SUMMARY "}\n";
591						}
592	9				66	close COUNTER_SUMMARY;
593
594						# display the current unknown
595	9				20	for my $char (sort keys %letter_map) {
596	34 34				19 62	for $key (sort CheckSpelling::Util::case_biased keys(%{$letter_map{$char}})) {
597	29 29				14 39	my %word_map = %{$letter_map{$char}{$key}};
598	29				23	my @words = keys(%word_map);
599	29	100			22	if (scalar(@words) > 1) {
600	13 21	50			9 75	print $key." (".(join ", ", sort { length($a) <=> length($b) || $a cmp $b } @words).")";
601						} else {
602	16				52	print $words[0];
603						}
604	29				96	print "\n";
605						}
606						}
607						}
608
609						1;