——————————#
# BioPerl module for Bio::Tools::Run::EMBOSSApplication
#
# Copyright Heikki Lehvaslaiho
#
# You may distribute this module under the same terms as perl itself
# POD documentation - main docs before the code
=head1 NAME
Bio::Tools::Run::EMBOSSApplication - class for EMBOSS Applications
=head1 SYNOPSIS
# Get an EMBOSS factory
use Bio::Factory::EMBOSS;
$f = Bio::Factory::EMBOSS -> new();
# Get an EMBOSS application object from the factory
$water = $f->program('water') || die "Program not found!\n";
# Here is an example of running the application - water can
# compare 1 sequence against 1 or more sequences using Smith-Waterman.
# Pass a Sequence object and a reference to an array of objects.
my $wateroutfile = 'out.water';
$water->run({-asequence => $seq_object,
-bsequence => \@seq_objects,
-gapopen => '10.0',
-gapextend => '0.5',
-outfile => $wateroutfile});
# Now you might want to get the alignment
use Bio::AlignIO;
my $alnin = Bio::AlignIO->new(-format => 'emboss',
-file => $wateroutfile);
while ( my $aln = $alnin->next_aln ) {
# process the alignment -- these will be Bio::SimpleAlign objects
}
=head1 DESCRIPTION
The EMBOSSApplication class can represent any EMBOSS program. It is
created by a L<Bio::Factory::EMBOSS> object.
If you want to check command line options before sending them to the
program set $prog-E<gt>verbose to positive integer. The ADC
description of the available command line options is then parsed in
and compared to input.
See also L<Bio::Factory::EMBOSS> and L<Bio::Tools::Run::EMBOSSacd>.
=head1 FEEDBACK
=head2 Mailing Lists
User feedback is an integral part of the evolution of this and other
Bioperl modules. Send your comments and suggestions preferably to the
Bioperl mailing lists Your participation is much appreciated.
bioperl-l@bioperl.org - General discussion
http://bioperl.org/wiki/Mailing_lists - About the mailing lists
=head2 Support
Please direct usage questions or support issues to the mailing list:
I<bioperl-l@bioperl.org>
rather than to the module maintainer directly. Many experienced and
reponsive experts will be able look at the problem and quickly
address it. Please include a thorough description of the problem
with code and data examples if at all possible.
=head2 Reporting Bugs
Report bugs to the Bioperl bug tracking system to help us keep track
the bugs and their resolution. Bug reports can be submitted via the
web:
=head1 AUTHOR - Heikki Lehvaslaiho
Email heikki-at-bioperl-dot-org
=head2 CONTRIBUTORS
Email: jason-AT-bioperl_DOT_org
=head1 APPENDIX
The rest of the documentation details each of the object
methods. Internal methods are usually preceded with a _
=cut
# Let the code begin...
package
Bio::Tools::Run::EMBOSSApplication;
use
strict;
use
Data::Dumper;
sub
new {
my
(
$class
,
$args
) =
@_
;
my
$self
=
$class
->SUPER::new();
$self
->name(
$args
->{
'name'
});
$self
->verbose(
$args
->{
'verbose'
});
$self
->acd
if
$self
->verbose > 0;
return
$self
;
}
=head2 run
Title : run
Usage : $embossapplication->run($attribute_hash)
Function: Runs the EMBOSS program.
Returns : string or creates files for now; will return objects!
Args : hash of input to the program
=cut
sub
run {
my
(
$self
,
$input
) =
@_
;
$self
->io->_io_cleanup();
# test input
$self
->debug( Dumper(
$input
) );
# parse ACD information
$self
->acd
if
$self
->verbose > 0;
# collect the options into a string
my
$option_string
=
''
;
foreach
my
$attr
(
keys
%{
$input
}) {
my
$attr_name
=
substr
(
$attr
, 1)
if
substr
(
$attr
, 0, 1) =~ /\W/;
my
$array
= 0;
if
(
defined
$input
->{
$attr
} &&
ref
(
$input
->{
$attr
}) ) {
my
(
@pieces
);
if
(
$array
= (
ref
(
$input
->{
$attr
}) =~ /array/i) ) {
foreach
my
$s
( @{
$input
->{
$attr
}} ) {
@pieces
= @{
$input
->{
$attr
}};
}
}
else
{
@pieces
= (
$input
->{
$attr
});
}
if
( !
defined
$pieces
[0] ) {
# we ignore for now
$self
->
warn
(
"specified a parameter $attr with no value"
);
$input
->{
$attr
} =
undef
;
return
;
}
elsif
(
$pieces
[0]->isa(
'Bio::PrimarySeqI'
) ) {
unless
(
$SEQIOLOADED
) {
$SEQIOLOADED
= 1;
}
my
(
$tfh
,
$tempfile
) =
$self
->io->tempfile(
-dir
=>
$self
->tempdir);
my
$out
= Bio::SeqIO->new(
-format
=>
'fasta'
,
-fh
=>
$tfh
);
foreach
my
$seq
(
@pieces
) {
$out
->write_seq(
$seq
);
}
$out
->
close
();
$input
->{
$attr
} =
$tempfile
;
close
(
$tfh
);
undef
$tfh
;
}
elsif
(
$pieces
[0]->isa(
'Bio::Align::AlignI'
) ) {
unless
(
$ALIGNIOLOADED
) {
$ALIGNIOLOADED
= 1;
}
my
(
$tfh
,
$tempfile
) =
$self
->io->tempfile();
my
$out
= Bio::AlignIO->new(
-format
=>
'msf'
,
-fh
=>
$tfh
);
foreach
my
$p
(
@pieces
) {
$out
->write_aln(
$p
);
}
$input
->{
$attr
} =
$tempfile
;
close
(
$tfh
);
undef
$tfh
;
}
}
# check each argument against ACD
if
(
$self
->verbose > 0) {
last
unless
defined
$self
->acd;
# might not have the parser
$self
->throw(
"Attribute [$attr] not recognized!\n"
)
unless
$self
->acd->qualifier(
$attr
);
}
# print out debugging info
$self
->debug(
"Input attr: "
.
$attr_name
.
" => "
.
$input
->{
$attr
}.
"\n"
);
$option_string
.=
" "
.
$attr
;
$option_string
.=
" "
.
$input
->{
$attr
}
if
defined
$input
->{
$attr
};
}
# check mandatory attributes against given ones
if
(
$self
->verbose > 0) {
last
unless
defined
$self
->acd;
# might not have the parser
# $self->acd->mandatory->print;
# if ($self->name eq 'water') {
# print Dumper($self->acd->mandatory);
# }
foreach
my
$attr
(
keys
%{
$self
->acd->mandatory} ) {
last
unless
defined
$self
->acd;
# might not have the parser
unless
(
defined
$input
->{
$attr
}) {
"-"
x 38,
"\n"
,
"MISSING MANDATORY ATTRIBUTE: $attr\n"
,
"-"
x 38,
"\n"
;
$self
->acd->
(
$attr
) and
$self
->throw(
"Program "
.
$self
->name.
" needs attribute [$attr]!\n"
)
}
}
}
my
$runstring
=
join
(
' '
,
$self
->name,
$option_string
,
'-auto'
);
$self
->debug(
"Command line: "
,
$runstring
,
"\n"
);
return
`
$runstring
`;
}
=head2 acd
Title : acd
Usage : $embossprogram->acd
Function: finds out all the possible qualifiers for this
EMBOSS application. They can be used to debug the
options given.
Throws :
Returns : boolean
Args :
=cut
sub
acd {
my
(
$self
) =
@_
;
unless
(
$self
->{
'_acd'
} ) {
$self
->{
'_acd'
} =
Bio::Tools::Run::EMBOSSacd->new(
$self
->name);
}
return
$self
->{
'_acd'
};
}
=head2 name
Title : name
Usage : $embossprogram->name
Function: sets/gets the name of the EMBOSS program
Setting is done by the EMBOSSFactory object,
you should only get it.
Throws :
Returns : name string
Args : None
=cut
sub
name {
my
(
$self
,
$value
) =
@_
;
if
(
defined
$value
) {
$self
->{
'_name'
} =
$value
;
}
return
$self
->{
'_name'
};
}
=head2 descr
Title : descr
Usage : $embossprogram->descr
Function: sets/gets the descr of the EMBOSS program
Setting is done by the EMBOSSFactory object,
you should only get it.
Throws :
Returns : description string
Args : None
=cut
sub
descr {
my
(
$self
,
$value
) =
@_
;
if
(
defined
$value
) {
$self
->{
'_descr'
} =
$value
;
}
return
$self
->{
'_descr'
};
}
=head2 group
Title : group
Usage : $embossprogram->group
Function: sets/gets the group of the EMBOSS program
Setting is done by the EMBOSSFactory object,
you should only get it.
If the application is assigned into a subgroup
use l<subgroup> to get it.
Throws :
Returns : string, group name
Args : group string
=cut
sub
group {
my
(
$self
,
$value
) =
@_
;
if
(
defined
$value
) {
my
(
$group
,
$subgroup
) =
split
':'
,
$value
;
$self
->{
'_group'
} =
$group
;
$self
->{
'_subgroup'
} =
$subgroup
;
}
return
$self
->{
'_group'
};
}
=head2 subgroup
Title : subgroup
Usage : $embossprogram->subgroup
Function: sets/gets the subgroup of the EMBOSS program
Setting is done by the EMBOSSFactory object,
you should only get it.
Throws :
Returns : string, subgroup name; undef if not defined
Args : None
=cut
sub
subgroup {
my
(
$self
) =
@_
;
return
$self
->{
'_subgroup'
};
}
=head2 program_dir
Title : program_dir
Usage :
Function: Required by WrapperBase
Throws :
Returns : Name of directory with EMBOSS programs
Args :
=cut
sub
program_dir {
return
Bio::Root::IO->catfile(
$ENV
{EMBOSS_ACDROOT});
}
=head2 program_path
Title : program_path
Usage :
Function: Required by WrapperBase
Throws :
Returns : Full path of program
Args :
=cut
sub
program_path {
my
$self
=
shift
;
my
$name
=
$self
->{_name};
my
$dir
= Bio::Root::IO->catfile(
$ENV
{EMBOSS_ACDROOT});
return
"$dir/$name"
;
}
=head2 executable
Title : executable
Usage :
Function: Required by WrapperBase
Throws :
Returns : Name of program
Args :
=cut
sub
executable {
my
$self
=
shift
;
$self
->{_name};
}
1;