Aard
view release on metacpan or search on metacpan
lib/Aard.pm view on Meta::CPAN
my $fh = $self->{fh};
my $part;
seek $fh, $offset, 0;
read $fh, $part, $length;
$part
}
# Return the decoded first-level index record for entry $index.
#
# The record is an array reference holding the fields obtained by unpacking
# the raw bytes with $self->{index_format}. Records are read on first use and
# then remembered in $self->{index1}, so each one is read at most once.
sub index1 {
    my ($self, $index) = @_;

    # Repeated lookups are answered straight from the per-object cache.
    return $self->{index1}{$index} if exists $self->{index1}{$index};

    # Every record occupies index_length bytes, so record N starts
    # N * index_length bytes after index1_offset.
    my $position = $self->{index1_offset} + $index * $self->{index_length};
    my $raw      = $self->read_at($position, $self->{index_length});

    my @fields = unpack $self->{index_format}, $raw;
    $self->{index1}{$index} = \@fields;

    return $self->{index1}{$index};
}
# Return the dictionary's open filehandle (the object's 'fh' slot).
sub fh {
    my ($self) = @_;
    return $self->{fh};
}

# Return the value stored in the object's 'sha1sum' slot.
sub sha1sum {
    my ($self) = @_;
    return $self->{sha1sum};
}

# Return the value stored in the object's 'uuid' slot.
sub uuid {
    my ($self) = @_;
    return $self->{uuid};
}
# Return the result of passing this object's uuid through uuid_to_string.
sub uuid_string {
    my ($self) = @_;
    return uuid_to_string($self->uuid);
}
# Return the value stored in the object's 'volume' slot.
sub volume {
    my ($self) = @_;
    return $self->{volume};
}

# Return the value stored in the object's 'total_volumes' slot.
sub total_volumes {
    my ($self) = @_;
    return $self->{total_volumes};
}

# Return the number of entries in this dictionary (the 'index_count' slot).
sub count {
    my ($self) = @_;
    return $self->{index_count};
}

# Return the metadata structure stored in the object's 'meta' slot.
sub meta {
    my ($self) = @_;
    return $self->{meta};
}
# Convenience accessors: each one looks up the entry of the same name in the
# hash returned by the object's meta method.

sub article_count {
    my ($self) = @_;
    return $self->meta->{article_count};
}

sub article_count_is_volume_total {
    my ($self) = @_;
    return $self->meta->{article_count_is_volume_total};
}

sub index_language {
    my ($self) = @_;
    return $self->meta->{index_language};
}

sub article_language {
    my ($self) = @_;
    return $self->meta->{article_language};
}

sub title {
    my ($self) = @_;
    return $self->meta->{title};
}

sub version {
    my ($self) = @_;
    return $self->meta->{version};
}

sub description {
    my ($self) = @_;
    return $self->meta->{description};
}

sub copyright {
    my ($self) = @_;
    return $self->meta->{copyright};
}

sub license {
    my ($self) = @_;
    return $self->meta->{license};
}

sub source {
    my ($self) = @_;
    return $self->meta->{source};
}
# Return the key of entry $index, reading it from the file on first use and
# caching it in $self->{key} afterwards.
sub key {
    my ($self, $index) = @_;

    if (!exists $self->{key}{$index}) {
        # Field 0 of the index1 record is the key's position relative to
        # index2_offset.
        my $pointer = $self->index1($index)->[0];

        # The key is stored as a 2-byte big-endian unsigned length followed
        # by that many bytes of key data.
        my $prefix  = $self->read_at($self->{index2_offset} + $pointer, 2);
        my $key_len = unpack 'S>', $prefix;

        # No seek here: this read continues from wherever read_at left the
        # handle, i.e. right after the length prefix.
        read $self->{fh}, $self->{key}{$index}, $key_len;
    }

    return $self->{key}{$index};
}
# Return the decompressed article of entry $index, reading it from the file
# on first use and caching the result in $self->{article} afterwards.
sub article {
    my ($self, $index) = @_;

    return $self->{article}{$index} if exists $self->{article}{$index};

    # Field 1 of the index1 record is the article's position relative to
    # article_offset.
    my $pointer = $self->index1($index)->[1];

    # The article is stored as a 4-byte big-endian unsigned length followed
    # by that many bytes, which are handed to decompress.
    my $buffer = $self->read_at($self->{article_offset} + $pointer, 4);
    my $size   = unpack 'L>', $buffer;

    # No seek here: this read continues from wherever read_at left the
    # handle, i.e. right after the length prefix.
    read $self->{fh}, $buffer, $size;

    $self->{article}{$index} = decompress($buffer);
    return $self->{article}{$index};
}
# Constructor: open the dictionary file $file and return an object blessed
# into the invoking class.
#
# The header is read field by field as described by HEADER_SPEC(), whose
# entries are [name, unpack template, byte length]. The metadata block of
# meta_length bytes that follows is decompressed and decoded as JSON.
#
# The resulting object holds every header field plus:
#   fh            - the open, binmode'd filehandle
#   meta          - the decoded metadata
#   index_format  - unpack template for one index1 record
#   index_length  - size in bytes of one index1 record
#   index1_offset - file position of the first index
#   index2_offset - file position of the second index
#
# Dies if the file cannot be opened (the message names the file), if the
# header or metadata is shorter than announced, if the signature is not
# 'aard', or if the format version is not 1.
sub new {
    my ($class, $file) = @_;
    open my $fh, '<', $file or die "Cannot open '$file': $!";
    binmode $fh;

    my %header;
    for my $field (@{HEADER_SPEC()}) {
        my ($name, $template, $size) = @$field;
        my $got = read $fh, my $part, $size;
        # A short read means the file ends inside the header; unpacking the
        # partial data would silently yield undefined header fields.
        die 'Not a recognized aarddict dictionary file (truncated header)'
            unless defined $got && $got == $size;
        $header{$name} = unpack $template, $part;
    }
    die 'Not a recognized aarddict dictionary file' if $header{signature} ne 'aard';
    die 'Unknown file format version' if $header{version} != 1;

    my $meta_read = read $fh, my $meta, $header{meta_length};
    die 'Truncated aarddict dictionary file (incomplete metadata)'
        unless defined $meta_read && $meta_read == $header{meta_length};
    $meta = decode_json(decompress($meta));

    # Index records come in two layouts; anything other than '>LL' is
    # treated as the wider 12-byte form.
    my $short_records = $header{index1_item_format} eq '>LL';
    my %obj = (
        %header,
        fh           => $fh,
        meta         => $meta,
        index_format => ($short_records ? 'L>L>' : 'L>Q>'),
        index_length => ($short_records ? 8 : 12),
    );
    # index1 starts right after the header and the metadata block; index2
    # follows the index_count fixed-size records of index1.
    $obj{index1_offset} = $header_length + $obj{meta_length};
    $obj{index2_offset} = $obj{index1_offset} + $obj{index_count} * $obj{index_length};

    return bless \%obj, $class;
}
1;
__END__
=head1 NAME
Aard - Read aarddict dictionaries
=head1 SYNOPSIS
use Aard;
my $dict = Aard->new('something.aar');
printf "This dictionary (volume %d of %d) has %d entries\n", $dict->volume, $dict->total_volumes, $dict->count;
printf "The tenth entry's key: %s\n", $dict->key(9);
printf "The tenth entry's value: %s\n", $dict->article(9);
=head1 DESCRIPTION
Aard is a module for reading files in the Aard Dictionary format (.aar). A dictionary is an array of I<(key, article)> pairs, with some associated metadata.
=over
=item B<new>(I<filename>)
Creates a new Aard object for the given file.
=item B<fh>
Returns the open filehandle to the dictionary.
=item B<count>
Returns the number of entries in this dictionary.
=item B<key>(I<index>)
Returns the key of the I<index>th element. This method caches the keys.
( run in 1.885 second using v1.01-cache-2.11-cpan-cdf2f3d4e48 )