Alvis-TermTagger
view release on metacpan or search on metacpan
lib/Alvis/TermTagger.pm view on Meta::CPAN
# Open the term list for reading. The explicit '<' mode (three-argument
# open) prevents a file name that starts with '>' or ends with '|' from
# being interpreted as a write mode or a command pipe.
# On failure, report the actual system error ($!) rather than always
# claiming the file does not exist.
open(DESC_TERMLIST, '<', $termlist_name) or die "$0: $termlist_name: $!\n";
# Lines read from this handle are decoded from UTF-8 by the :utf8 layer.
binmode(DESC_TERMLIST, ":utf8");
while($line1 = <DESC_TERMLIST>) {
chomp $line1;
utf8::decode($line1);
$line=$line1;
# Blank and comment lines are thrown away
if (($line !~ /^\s*\#/o)&&($line !~ /^\s*\/\//o)&&($line !~ /^\s*$/o)) {
# Term is split from the other information
my @tab = split / ?[\|:] ?/, $line;
if ($tab[0] !~ /^\s*$/) {
# TODO better
$tab[0] =~ s/ +/ /go;
$tab[0] =~ s/ $//go;
$tab[0] =~ s/^ //go;
# $tab[0] =~ s/\\:/:/go;
# warn "term: " . $tab[0] . "\n";;
( run in 0.593 second using v1.01-cache-2.11-cpan-cdf2f3d4e48 )