Lingua-TFIDF

 view release on metacpan or  search on metacpan

lib/Lingua/TFIDF/WordSegmenter/JA/MeCab.pm  view on Meta::CPAN

use Text::MeCab;

# Encode object for the encoding named by the Text::MeCab::ENCODING constant.
# It is looked up once when the module is loaded and reused by segment() to
# encode each document before further processing.
# NOTE(review): presumably this is the encoding the MeCab dictionary expects --
# confirm against Text::MeCab. No `use Encode` is visible in this excerpt;
# verify it is loaded elsewhere in the file.
my $mecab_encoding = Encode::find_encoding(Text::MeCab::ENCODING);

# Constructor for the MeCab-backed word segmenter.
#
# Arguments are declared through `args` (presumably Smart::Args; its import
# is not visible in this excerpt):
#   mecab - optional Text::MeCab instance to use for segmentation. When it is
#           omitted or undefined, a fresh Text::MeCab object is created.
#
# Returns a hash-based object blessed into $class, holding the tagger under
# the `mecab` key.
sub new {
  args
    my $class => 'ClassName',
    my $mecab => +{ isa => 'Text::MeCab', optional => 1 };

  # Fall back to a default tagger when the caller did not supply one.
  unless (defined $mecab) {
    $mecab = Text::MeCab->new;
  }

  my $self = bless { mecab => $mecab }, $class;
  return $self;
}

# Read-only accessor: returns whatever is stored under the `mecab` key of the
# invocant (the tagger placed there by new()).
sub mecab {
  my $tagger = $_[0]->{mecab};
  return $tagger;
}

sub segment {
  args_pos
    my $self,
    my $document => 'Ref | Str';

  my $input = $mecab_encoding->encode(ref $document ? $$document : $document);

lib/Lingua/TFIDF/WordSegmenter/LetterNgram.pm  view on Meta::CPAN

use Carp qw//;
use Smart::Args;

# Constructor for the letter n-gram segmenter.
#
# Arguments (declared and type-checked through Smart::Args' `args`):
#   n - required integer; must be strictly positive.
#
# Croaks with 'Word length must be 1+.' when n is zero or negative.
# Returns a hash-based object blessed into $class, holding n under the
# `n` key.
sub new {
  args
    my $class => 'ClassName',
    my $n => 'Int';

  # The Int constraint admits zero and negatives, so reject those here.
  if ($n <= 0) {
    Carp::croak('Word length must be 1+.');
  }

  my $self = bless { n => $n }, $class;
  return $self;
}

# Read-only accessor: returns the value stored under the `n` key of the
# invocant (the value validated and stored by new()).
sub n {
  my $length = $_[0]->{n};
  return $length;
}

sub segment {
  args_pos
    my $self,
    my $document => 'Ref | Str';

  $document = \"$document" unless ref $document;

 view all matches for this distribution
 view release on metacpan -  search on metacpan

( run in 1.378 second using v1.00-cache-2.02-grep-82fe00e-cpan-1925d2aa809 )