#!/usr/bin/env perl
#
# This file is part of moses. Its use is licensed under the GNU Lesser General
# Public License version 2.1 or, at your option, any later version.
use warnings;
use strict;

# Reduce every word of a text file to its lowercased suffix.
#
# Usage: <script> SIZE IN OUT
#   SIZE  maximum number of trailing characters kept from each word
#   IN    path of the input text file (read through the :utf8 layer)
#   OUT   path of the output text file (written through the :utf8 layer)
#
# Every input line produces exactly one output line in which the words are
# separated by single spaces, each word longer than SIZE characters is cut
# down to its last SIZE characters, and the result is lowercased.

die "Usage: $0 SIZE IN OUT\n" if @ARGV < 3;
my ($size, $in, $out) = @ARGV;
die "SIZE must be a non-negative integer, got '$size'\n"
    unless $size =~ /\A[0-9]+\z/;

# Three-argument open keeps the mode separate from the filename, and lexical
# handles avoid package-global barewords. Failing to open either file is
# fatal rather than silently producing an empty result.
open(my $in_fh, '<:utf8', $in)
    or die "Cannot open '$in' for reading: $!\n";
open(my $out_fh, '>:utf8', $out)
    or die "Cannot open '$out' for writing: $!\n";

while (my $line = <$in_fh>) {
    print {$out_fh} suffix_line($line, $size), "\n"
        or die "Cannot write to '$out': $!\n";
}

# Buffered write errors may only surface when the handle is closed.
close($out_fh) or die "Cannot close '$out': $!\n";
close($in_fh)  or die "Cannot close '$in': $!\n";

# Return $line with each whitespace-separated word replaced by the lowercased
# form of its last $max_chars characters, joined by single spaces.
# The result carries no trailing newline.
sub suffix_line {
    my ($line, $max_chars) = @_;

    chomp $line;
    # Collapse every whitespace run to one plain space before splitting.
    $line =~ s/\s+/ /g;

    my @suffixes;
    # split ' ' skips leading whitespace and drops trailing empty fields,
    # so no separate trimming is needed.
    for my $word (split ' ', $line) {
        if (length($word) > $max_chars) {
            # Computed from the length on purpose: substr($word, -$max_chars)
            # would return the whole word when $max_chars is 0.
            $word = substr($word, length($word) - $max_chars);
        }
        # Truncate first, lowercase second: lowercasing may change the
        # number of characters in a word.
        push @suffixes, lc $word;
    }
    return join ' ', @suffixes;
}