use strict;
use Digest::MD5 qw(md5_hex);
=head1 NAME
SWISH::Filters::ImageToMD5Xml - Adds MD5 information when filtering an image for Swish-e.
=head1 VERSION
Version 0.05
our $VERSION = '0.05';    # keep in sync with the "Version" line in the POD
A L<SWISH::Filter> that takes an incoming image XML document and adds an MD5
checksum computed over the Base64 text found in its C<b64_data> element.
The XML structure this filter expects includes an C<b64_data> element containing
the Base64 string representing the image. If that element (tag) is not found,
no filter is applied.
=head1 METHODS
=head2 new ( $class )
sub new {
    # Constructor. The invocant may be a class name or an existing object,
    # in which case the object's class is reused. An empty hash is blessed
    # into that class and passed through _init(), whose return value is
    # what the caller receives.
    my $invocant = shift;
    my $package  = ref($invocant) || $invocant;

    return bless( {}, $package )->_init;
}
sub _init {
# Prepares a freshly blessed filter object and returns that same object.
my ( $self ) = @_;
# use_modules() is not defined in this file; presumably it is inherited from
# the SWISH::Filter base class and loads the listed modules -- confirm.
$self->use_modules(qw/MIME::Base64 Search::Tools::XML XML::Simple/);
# NOTE(review): the contents and the closing ");" of this list are not
# visible here, so the MIME types being registered cannot be determined
# from this view.
my @mimetypes = (
# A reference to the list is stored on the object under the "mimetypes" key.
$self->{mimetypes} = \@mimetypes;
return $self;
sub _parse_xml {
    # Parses $xml with XMLin() and returns whatever XMLin() produces.
    #
    # $xml is handed to XMLin() unchanged. When $xml is false (undef, '',
    # 0) nothing is parsed and a bare return yields undef in scalar context
    # and an empty list in list context, instead of falling off the end of
    # the sub.
    #
    # XMLin() is not imported at compile time in this file; presumably it
    # becomes available once use_modules() has loaded XML::Simple in
    # _init() -- confirm.
    my ( $self, $xml ) = @_;

    return unless $xml;

    return XMLin($xml);
}
=head2 filter( $self, $doc )
Generates XML metadata for indexing. If I<$doc> contains the C<b64_data> element (tag),
an MD5 checksum string is added to the XML, which is returned under a new root element C<image_data>.
sub filter {
    # Adds an "md5" entry to a parsed image XML document and returns the
    # re-serialised XML.
    #
    # Parameters:
    #   $self - the filter object
    #   $doc  - document object; only its is_binary() and fetch_filename()
    #           methods are used here
    #
    # Returns a reference to the new XML string (root element "image_data"),
    # or nothing when the document is binary, has no filename, cannot be
    # parsed into a hash, or carries no usable b64_data value.
    my ( $self, $doc ) = @_;

    return if $doc->is_binary;

    my $source = $doc->fetch_filename or return;
    my $ds     = $self->_parse_xml($source) or return;

    # XMLin() can hand back a non-hash value (e.g. a plain string for a
    # text-only root element); dereferencing that under strict refs dies.
    return unless ref $ds eq 'HASH';

    return unless exists $ds->{b64_data};
    my $b64 = $ds->{b64_data};

    # By default XML::Simple represents an empty element as an empty hash
    # ref, and an element with attributes as a hash. Hashing the
    # stringified reference ("HASH(0x...)") would produce a meaningless,
    # non-reproducible checksum, so such documents are left unfiltered.
    return if !defined $b64 || ref $b64;

    # The digest is taken over the Base64 text exactly as parsed, not over
    # the decoded image bytes.
    # NOTE(review): MIME::Base64 is requested in _init() but never used
    # here -- confirm whether hashing the decoded bytes was intended.
    $ds->{md5} = md5_hex($b64);

    my $image_xml
        = Search::Tools::XML->perl_to_xml( $ds, { root => 'image_data' } );

    return ( \$image_xml );
}
=head1 AUTHOR
Logan Bell, C<< <loganbell at> >>
1; # End of SWISH::Filters::ImageToMD5Xml