Apache-Tika-Async
view release on metacpan or search on metacpan
bin/script.pl view on Meta::CPAN
#!perl -w
use strict;
use Apache::Tika::Server;
use Getopt::Long;
use File::Basename;
use File::Spec;
GetOptions(
'jar|j=s' => \my $tika_path,
);
use Data::Dumper;
if( ! $tika_path ) {
my $tika_glob = File::Spec->rel2abs( dirname($0) ) . '/../jar/*.jar';
$tika_path = Apache::Tika::Async->best_jar_file(glob $tika_glob);
die "Tika not found in '$tika_glob'" unless $tika_path and -f $tika_path;
}
my $tika= Apache::Tika::Server->new(
jarfile => $tika_path,
#connection_class => 'Apache::Tika::Connection::LWP',
connection_class => 'Apache::Tika::Connection::AEHTTP',
#java => '"C:/Program Files (x86)/Java/jre7/bin/java.exe"',
);
$tika->launch();
#my $tika= Apache::Tika->new;
my $fn= shift;
my $meta = $tika->get_meta($fn);
print "Content-Type: " . $meta->{'Content-Type'} . "\n";
print $tika->get_text($fn)->content;
#print Dumper $meta;
( run in 0.897 second using v1.01-cache-2.11-cpan-39bf76dae61 )