package Alien::Build::Plugin::Decode::HTML;

use strict;
use warnings;
use 5.008004;
use Alien::Build::Plugin;
use File::Basename ();

# ABSTRACT: Plugin to extract links from HTML
our $VERSION = '2.45'; # VERSION

# Plugin initializer.
#
# Declares HTML::LinkExtor, URI and URI::Escape as requirements for the
# 'share' phase, then registers a 'decode' hook on $meta.  The hook takes
# a response hash ($res) and:
#
#   * dies unless $res->{type} is 'html';
#   * walks every link found in $res->{content}, resolving each <a href>
#     against $res->{base} (or against a <base href> seen in the document);
#   * returns { type => 'list', list => [ { filename => ..., url => ... }, ... ] }.
#
# Returns the plugin instance ($self).
sub init {
  my($self, $meta) = @_;

  for my $module (qw( HTML::LinkExtor URI URI::Escape )) {
    $meta->add_requires('share' => $module => 0);
  }

  $meta->register_hook( decode => sub {
    my $res = $_[1];

    $res->{type} eq 'html'
      or die "do not know how to decode @{[ $res->{type} ]}";

    # Starting point for resolving relative links; a <base> tag in the
    # document replaces it for the links that follow.
    my $base = URI->new($res->{base});
    my @list;

    my $extractor = HTML::LinkExtor->new(sub {
      my($tag, %attr) = @_;

      # Both tags of interest are only acted on when href is a true value.
      my $href = $attr{href};
      return unless $href;

      if($tag eq 'base') {
        $base = URI->new($href);
        return;
      }

      return unless $tag eq 'a';

      # Ignore links that just point at the current or parent directory.
      return if $href =~ m!^\.\.?/?$!;

      my $url  = URI->new_abs($href, $base);
      my $path = $url->path;
      $path =~ s{/$}{}; # work around for Perl 5.8.7- gh#8

      my $filename = URI::Escape::uri_unescape(File::Basename::basename($path));
      my $location = URI::Escape::uri_unescape($url->as_string);

      push @list, {
        filename => $filename,
        url      => $location,
      };
    });

    $extractor->parse($res->{content});

    return { type => 'list', list => \@list };
  });

  return $self;
}

1;

__END__

=pod

=encoding UTF-8

=head1 NAME

Alien::Build::Plugin::Decode::HTML - Plugin to extract links from HTML

=head1 VERSION

version 2.45

=head1 SYNOPSIS

 use alienfile;
 plugin 'Decode::HTML';

=head1 DESCRIPTION

Note: in most cases you will want to use L<Alien::Build::Plugin::Download::Negotiate>
instead.  It picks the appropriate decode plugin based on your platform and environment.
In some cases you may need to use this plugin directly instead.

This plugin decodes an HTML file listing into a list of candidates for your Prefer plugin.

=head1 SEE ALSO

L<Alien::Build::Plugin::Download::Negotiate>, L<Alien::Build>, L<alienfile>, L<Alien::Build::MM>, L<Alien>

=head1 AUTHOR

Author: Graham Ollis E<lt>plicease@cpan.orgE<gt>

Contributors:

Diab Jerius (DJERIUS)

Roy Storey (KIWIROY)

Ilya Pavlov

David Mertens (run4flat)

Mark Nunberg (mordy, mnunberg)

Christian Walde (Mithaldu)

Brian Wightman (MidLifeXis)

Zaki Mughal (zmughal)

mohawk (mohawk2, ETJ)

Vikas N Kumar (vikasnkumar)

Flavio Poletti (polettix)

Salvador Fandiño (salva)

Gianni Ceccarelli (dakkar)

Pavel Shaydo (zwon, trinitum)

Kang-min Liu (劉康民, gugod)

Nicholas Shipp (nshp)

Juan Julián Merelo Guervós (JJ)

Joel Berger (JBERGER)

Petr Písař (ppisar)

Lance Wicks (LANCEW)

Ahmad Fatoum (a3f, ATHREEF)

José Joaquín Atria (JJATRIA)

Duke Leto (LETO)

Shoichi Kaji (SKAJI)

Shawn Laffan (SLAFFAN)

Paul Evans (leonerd, PEVANS)

Håkon Hægland (hakonhagland, HAKONH)

nick nauwelaerts (INPHOBIA)

=head1 COPYRIGHT AND LICENSE

This software is copyright (c) 2011-2020 by Graham Ollis.

This is free software; you can redistribute it and/or modify it under
the same terms as the Perl 5 programming language system itself.

=cut