/usr/share/perl5/HTML/RewriteAttributes.pm is in libhtml-rewriteattributes-perl 0.05-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 | #!/usr/bin/env perl
package HTML::RewriteAttributes;
use strict;
use warnings;
use base 'HTML::Parser';
use Carp 'croak';
use HTML::Entities 'encode_entities';
our $VERSION = '0.05';
sub new {
my $class = shift;
return $class->SUPER::new(
start_h => [ '_start_tag', "self,tagname,attr,attrseq,text" ],
default_h => [ '_default', "self,tagname,attr,text" ],
);
}
sub rewrite {
my $self = shift;
$self = $self->new if !ref($self);
$self->_rewrite(@_);
}
sub _rewrite {
my $self = shift;
my $html = shift;
my $cb = shift || sub { $self->rewrite_resource(@_) };
$self->_begin_rewriting($cb);
$self->parse($html);
$self->eof;
$self->_done_rewriting;
return $self->{rewrite_html};
}
sub rewrite_resource {
my $self = shift;
my $class = ref($self) || $self;
my $error = "You must specify a callback to $class->rewrite";
$error .= " or define $class->rewrite_resource" if $class ne __PACKAGE__;
croak "$error.";
}
sub _begin_rewriting {
my $self = shift;
my $cb = shift;
$self->{rewrite_html} = '';
$self->{rewrite_callback} = $cb;
}
sub _done_rewriting { }
sub _should_rewrite { 1 }
sub _start_tag {
my ($self, $tag, $attrs, $attrseq, $text) = @_;
$self->{rewrite_html} .= "<$tag";
for my $attr (@$attrseq) {
next if $attr eq '/';
if ($self->_should_rewrite($tag, $attr)) {
$attrs->{$attr} = $self->_invoke_callback($tag, $attr, $attrs->{$attr});
next if !defined($attrs->{$attr});
}
$self->{rewrite_html} .= sprintf ' %s="%s"',
$attr,
encode_entities($attrs->{$attr});
}
$self->{rewrite_html} .= ' /' if $attrs->{'/'};
$self->{rewrite_html} .= '>';
}
sub _default {
my ($self, $tag, $attrs, $text) = @_;
$self->{rewrite_html} .= $text;
}
sub _invoke_callback {
my $self = shift;
my ($tag, $attr, $value) = @_;
return $self->{rewrite_callback}->($tag, $attr, $value);
}
1;
__END__
=head1 NAME
HTML::RewriteAttributes - concise attribute rewriting
=head1 SYNOPSIS
$html = HTML::RewriteAttributes->rewrite($html, sub {
my ($tag, $attr, $value) = @_;
# delete any attribute that mentions..
return if $value =~ /COBOL/i;
$value =~ s/\brocks\b/rules/g;
return $value;
});
# writing some HTML email I see..
$html = HTML::RewriteAttributes::Resources->rewrite($html, sub {
my $uri = shift;
my $content = render_template($uri);
my $cid = generate_cid_from($content);
$mime->attach($cid => content);
return "cid:$cid";
});
# up for some HTML::ResolveLink?
$html = HTML::RewriteAttributes::Links->rewrite($html, "http://search.cpan.org");
# or perhaps HTML::LinkExtor?
HTML::RewriteAttributes::Links->rewrite($html, sub {
my ($tag, $attr, $value) = @_;
push @links, $value;
$value;
});
=head1 DESCRIPTION
C<HTML::RewriteAttributes> is designed for simple yet powerful HTML attribute
rewriting.
You simply specify a callback to run for each attribute and we do the rest
for you.
This module is designed to be subclassable to make handling special cases
eaiser. See the source for methods you can override.
=head1 METHODS
=head2 C<new>
You don't need to call C<new> explicitly - it's done in L</rewrite>. It takes
no arguments.
=head2 C<rewrite> HTML, callback -> HTML
This is the main interface of the module. You pass in some HTML and a callback,
the callback is invoked potentially many times, and you get back some similar
HTML.
The callback receives as arguments the tag name, the attribute name, and the
attribute value (though subclasses may override this --
L<HTML::RewriteAttributes::Resources> does). Return C<undef> to remove the
attribute, or any other value to set the value of the attribute.
=head1 SEE ALSO
L<HTML::Parser>, L<HTML::ResolveLink>, L<Email::MIME::CreateHTML>,
L<HTML::LinkExtor>
=head1 THANKS
Some code was inspired by, and tests borrowed from, Miyagawa's
L<HTML::ResolveLink>.
=head1 AUTHOR
Shawn M Moore, C<< <sartak@bestpractical.com> >>
=head1 LICENSE
Copyright 2008-2010 Best Practical Solutions, LLC.
HTML::RewriteAttributes is distributed under the same terms as Perl itself.
=cut
|