FunctionalPerl

 view release on metacpan or  search on metacpan

htmlgen/FunctionalPerl/Htmlgen/MarkdownPlus.pm  view on Meta::CPAN

#
# Copyright (c) 2014-2019 Christian Jaeger, copying@christianjaeger.ch
#
# This is free software, offered under either the same terms as perl 5
# or the terms of the Artistic License version 2 or the terms of the
# MIT License (Expat version). See the file COPYING.md that came
# bundled with this file.
#

=head1 NAME

FunctionalPerl::Htmlgen::MarkdownPlus

=head1 SYNOPSIS

    use FunctionalPerl::Htmlgen::MarkdownPlus qw(markdownplus_parse);
    use PXML::XHTML qw(BODY);

    my $mediawikitoken = rand;
    # passed to mediawiki_prepare from FunctionalPerl::Htmlgen::Mediawiki
    my ($h1,$body1) = markdownplus_parse(
          "# Hi\n\nHello [World](http://world).\n", # markdownplusstr
          "Hi too", # alternative_title
          $mediawikitoken);
    is $h1->string, '<h1>Hi</h1>';
    is BODY($body1)->string,
       '<body><p>Hello <a href="http://world">World</a>.</p></body>';


=head1 DESCRIPTION

C<markdownplus_parse> is a wrapper around L<Text::Markdown> that
parses the latter's html string to L<PXML::XHTML> elements
(C<PXML::_::XHTML> objects which are L<PXML::Element> objects). It
replaces mediawiki style links with tokens as a hack to make it
possible to implement those links without having to modify
L<Text::Markdown>.

(It also contains a hack to make C<<with_toc>...</with_toc>> tags
possible, but the actual implementation of the toc is independent.)

=head1 SEE ALSO

L<FunctionalPerl::Htmlgen::PXMLMapper> -- a protocol to further
process the parsed L<PXML>.

=head1 NOTE

This is alpha software! Read the status section in the package README
or on the L<website|http://functional-perl.org/>.

=cut

package FunctionalPerl::Htmlgen::MarkdownPlus;
use strict;
use warnings;
use warnings FATAL => 'uninitialized';
use experimental "signatures";
use Sub::Call::Tail;
use Exporter "import";

our @EXPORT      = qw();
our @EXPORT_OK   = qw(markdownplus_parse);
our %EXPORT_TAGS = (all => [@EXPORT, @EXPORT_OK]);

use FP::Docstring;
use Chj::TEST;
use PXML qw(is_pxml_element);
use PXML::XHTML ":all";
use FP::Stream ":all";
use FunctionalPerl::Htmlgen::Htmlparse 'htmlparse';
use Text::Markdown 'markdown';
use FP::Lazy;
use FunctionalPerl::Htmlgen::Mediawiki qw(mediawiki_prepare);

# Return <h1> element if available, and rest.
sub pxml_body_split_h1($body) {
    my $b = stream_mixed_flatten $body;
    my ($v, $rest) = $b->first_and_rest;
    if (is_pxml_element $v and $v->name eq "h1") { ($v, $rest) }
    else                                         { (undef, $body) }
}

TEST { [pxml_body_split_h1 ["foo"]] }
[undef, ['foo']];

TEST { [pxml_body_split_h1 [H1("x"), "foo"]]->[0] }
H1("x");

TEST {
    my ($h1, $rest) = pxml_body_split_h1 [H1("x", "y"), "foo", B("bar")];
    [$h1->string, BODY($rest)->string]
}
['<h1>xy</h1>', '<body>foo<b>bar</b></body>'];

sub markdownplus_parse ($str, $alternative_title, $mediawikitoken) {
    __
        '($str, $alternative_title, $tokenstr)-> ($h1, [$body_PXML_Elements], $hashtbl) '
        . '-- markdown parsing to PXML, extracting title, and replacing'
        . ' mediawiki syntax with $tokenstr based replacements'
        . ' (side channelling hack)';

    my ($str1, $table) = mediawiki_prepare($str, $mediawikitoken);

    my $htmlstr = markdown($str1);

    # XX hack: fix '<p><with_toc></p> .. <p></with_toc></p>' before
    # parsing, to avoid losing the with_toc element. Bah.
    $htmlstr =~ s|<p>\s*(</?with_toc[^<>]*>)\s*</p>|$1|sg;

    # `markdown` returns a series of <p> elements etc., not wrapped in
    # any element. Need to wrap it before parsing or it will drop the
    # outmost element if it's (e.g.?) <with_toc>.
    my $bodyelement = htmlparse('<body>' . $htmlstr . '</body>', "body");

    my $body = $bodyelement->body;
    my ($maybe_h1, $rest) = pxml_body_split_h1($body);
    (
        (
            defined $maybe_h1
            ? ($maybe_h1, $rest)
            : (H1(force($alternative_title)), $body)
        ),
        $table
    )
}

1



( run in 0.474 second using v1.01-cache-2.11-cpan-39bf76dae61 )