Back | WordLists

BulgarianStemmer - bulgarianStemmer.txt

Download Complete Wordlist (4.07 K)
Download Complete Wordlist bzip2 Compressed (1.25 K)
Showing 38 Randomly Sampled Lines...
return(substr($word,0,$i-4));
$word = $_[0];
$line =~ s/^(\s)+//;
}
}
# Light stemmer for Bulgarian language (to be viewed by selecti
return(substr($word,0,$i-6));
print "$stem\n";
}
return($line);
return(substr($word,0,$i-4));
$line = substr($line,0,$i-6);
};
if ($word =~ m/еве$/) { # final -eBe --> N
$i -= 2;
# Light stemmer for Bulgarian language (to be viewed by selecting UTF-8 en
# Light stemmer for Bulgarian language (to be viewed by selecting UTF-8 encoding)
return($line);
$line = substr($line,0,$i-2);
my($line, $i);
if ($i > 10) {
my($word, $i); # use local var $word and $i
substr($line,$i-4,4) = substr($line,$i-2,2);
if ($word =~ m/зи$/) { # final -(e)H --> T
# We assume that each character (in Cyrillic) needs two bytes
# rewritting rule -eH into -H
my($word, $i); # use a local var $word and $i
if ($word =~ m/е..и$/) { # rewritting rule
return($word);
$word =~ s/ци$/к/;
$word =~ s/зи$/г/;
if ($word =~ m/ия$/) { # final -H(R)
if ($word =~ m/си$/) { # final -cH --> x
if ($word =~ m/ове$/) { # final -OBe
return(substr($word,0,$i-4));
}
}
# done by J. Savoy University of Neuchatel (www.unine.ch/info


Back | WordLists