App-RecordStream

 view release on metacpan or  search on metacpan

lib/App/RecordStream/Operation/generate.pm  view on Meta::CPAN

use strict;

use base qw(App::RecordStream::Operation);

use App::RecordStream::Executor::Getopt;
use App::RecordStream::Executor;

use Data::Dumper;
use App::RecordStream::InputStream;
use App::RecordStream::Record;
use App::RecordStream::Executor;

sub init {
  my $this = shift;
  my $args = shift;

  my $keychain = '_chain';
  my $passthrough = 0;
  my $executor_options = App::RecordStream::Executor::Getopt->new();

  my $spec = {
    'keychain=s'  => \$keychain,
    'passthrough' => \$passthrough,
    $executor_options->arguments(),
  };

  $this->parse_options($args, $spec, ['bundling']);

  my $expression = $executor_options->get_string($args);
  my $executor = App::RecordStream::Executor->new($expression);

  $this->{'KEYCHAIN'}    = $keychain;
  $this->{'PASSTHROUGH'} = $passthrough;
  $this->{'EXECUTOR'} = $executor;
}

sub accept_record {
  my $this = shift;
  my $record = shift;

  $this->push_record($record) if $this->{'PASSTHROUGH'};

  my $interpolated_command = $this->{'EXECUTOR'}->execute_code($record);

  if ($@) {
    chomp $@;
    warn "# $0 interpolating command threw: " . $@ . "\n";
    return 1;
  }

  my $pid = open(my $pipe, "-|", $interpolated_command);

  if (!$pid) {
    warn "# $0 open(..., \"$interpolated_command |\") failed: $!\n";
    return 1;
  }

  my $generator_stream = App::RecordStream::InputStream->new(FH => $pipe);

  while(my $generated_record = $generator_stream->get_record()) {
    ${$generated_record->guess_key_from_spec($this->{'KEYCHAIN'})} = $record->as_hashref();
    $this->push_record($generated_record);
  }
  # App::RecordStream::InputStream closes the file handle for us

  return 1;
}

sub add_help_types {
  my $this = shift;
  $this->use_help_type('keyspecs');
}

sub usage
{
  my $this = shift;

  my $options = [
    App::RecordStream::Executor::options_help(),
    [ 'passthrough', 'Emit input record in addition to generated records' ],
    [ 'keychain <name>', 'Use \'name\' as the chain key (default is \'_chain\') may be a key spec, see \'--help-keyspecs\' for more info' ],
  ];

  my $args_string = $this->options_string($options);

  my $usage = <<USAGE;
Usage: recs-generate <args> <command> [<files>]
   __FORMAT_TEXT__
   Executes <command> for each record to generate a record stream, which is
   then output with a chain link back to the original record.

   <command> is executed opened as a command for each record of input (or
   records from <files>) with \$r set to a App::RecordStream::Record object. The output
   lines of each command execution are interpreted as a serialized Recs records,
   one per line. Each such line is reconstituted as a App::RecordStream::Record, and the
   '_chain' key is added to the record before it is printed. The value of the
   '_chain' key is the record that was originally passed to the eval expression.
   __FORMAT_TEXT__

   For instance.  If you did:
   recs-generate "recs-fromatomfeed http://...?key=\$r->{title}..."

   with input that looked like:
   { 'title' : 'foo' }
   { 'title' : 'bar' }

   then recs-generate would end up executing:
   recs-fromatomfeed http://...?key=foo...

   __FORMAT_TEXT__
   and interpreting the result as a series of new line separated records.

   If the result from recs-fromatomfeed was something like:
   __FORMAT_TEXT__
   { 'title' : 'zip' }
   { 'title' : 'zap' }

   __FORMAT_TEXT__
   then recs-generate would add the chain link so the output would look like:
   __FORMAT_TEXT__
   { 'title' : 'zip', 'chain' : { 'title' : 'foo' } }



( run in 1.325 second using v1.01-cache-2.11-cpan-39bf76dae61 )