# Positional arguments taken with shift: the first names the text file to
# read, the second names the dictionary file to write.
# NOTE(review): assumes this runs at file level, where shift reads @ARGV.
5 my $input_file = shift;
\r
6 my $output_file = shift;
\r
# Three-argument open with an explicit read mode: the file name is passed
# as data, so leading or trailing characters such as '>' or '|' in
# $input_file can no longer be interpreted as an open mode. $! appends the
# operating-system reason to the error message.
8 open( my $f, '<', $input_file ) or die "Cannot open input file $input_file: $!";
\r
# Append every line of the input to $text.
# NOTE(review): $text is not declared in the visible lines.
12 $text .= $_ while (<$f>) ;
\r
# Tokenize: every single character that is not a word character, an
# apostrophe or a hyphen is a separator. Adjacent separators therefore
# produce empty-string tokens in @a.
15 my @a = split /[^\w'-]/, $text ;
\r
# Count single tokens in %words. The postfix `if $w` skips false values, so
# the empty strings produced by the split are ignored.
# NOTE(review): the same test also skips the token "0", which is false in
# Perl -- confirm whether that is intended.
# NOTE(review): the closing braces of this loop and of the loops below are
# not among the visible lines.
16 foreach my $w (@a) {
\r
17 $words{$w} += 1 if $w ;
\r
# $j is the window length in tokens; it runs from 1 to 29.
19 for (my $j = 1; $j < 30; ++$j ) {
\r
# $i is the window start; the bound keeps the last index of the window,
# $i + $j - 1, inside @a.
20 for ( my $i = 0; $i + $j - 1 < @a; $i += 1 ) {
\r
# Append the $j tokens of the current window to $s, each preceded by a
# single space.
# NOTE(review): where $s is declared or reset is not visible here.
22 for ( my $k = 0; $k < $j; ++$k ) {
\r
23 $s .= ' '.$a[$i+$k];
\r
# Capture into $1 the part of $s that runs from a non-whitespace character
# to a later non-whitespace character, i.e. $s without surrounding spaces.
# The pattern needs at least three characters (\S, .+, \S), so a one- or
# two-character $s does not match, and the match result is not checked on
# this line.
# NOTE(review): the statement that consumes $1 is not visible; verify that
# it guards against a failed match.
25 $s =~ /\s*(\S.+\S)\s*/;
\r
# Open the dictionary file for writing. The three-argument form passes the
# mode separately from the name, so no character of $output_file can be
# interpreted as part of the open mode. $! appends the operating-system
# reason to the error message.
32 open (my $dst, '>', $output_file) or die "Cannot open output file $output_file: $!";
\r
# The first line of the dictionary is the number of entries in %words.
# The key count is added in one step instead of incrementing once per key.
# NOTE(review): the initialisation of $nCount is not visible; += keeps
# whatever starting value it has.
36 $nCount += scalar keys %words ;
\r
37 print $dst $nCount, "\n" ;
\r
# Progress message on the currently selected output handle (STDOUT unless
# changed elsewhere).
39 print "Generate test dictionary $output_file ...\n" ;
\r
# One entry per line, in hash iteration order (no sorting is applied).
40 print $dst $_, "\n" foreach (keys %words) ;
\r