<?xml version="1.0" encoding="UTF-8"?>
<s:scufl xmlns:s="http://org.embl.ebi.escience/xscufl/0.1alpha" version="0.2" log="0">
  <s:workflowdescription lsid="urn:lsid:net.sf.taverna:wfDefinition:fe6f841e-3148-4f45-b0e7-8d5949faeedd" author="Arnaud Kerhornou" title="Gene prediction Workflow that takes a FASTA sequence." />
  <s:processor name="Decode_base64_to_byte">
    <s:local>org.embl.ebi.escience.scuflworkers.java.DecodeBase64</s:local>
  </s:processor>
  <s:processor name="StringArticleName" boring="true">
    <s:stringconstant>content</s:stringconstant>
  </s:processor>
  <s:processor name="runEmbossPepstatsFromSequence">
    <s:description>Outputs a report of simple protein sequence information.</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>runEmbossPepstatsFromSequence</s:serviceName>
      <s:authorityName>inb.bsc.es</s:authorityName>
      <s:Parameter s:name="to" />
      <s:Parameter s:name="from" />
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="translateGeneIDGFFPredictions">
    <s:description>Translates the GeneID gene predictions, given in GFF format, into a set of aminoacid sequences</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>translateGeneIDGFFPredictions</s:serviceName>
      <s:authorityName>genome.imim.es</s:authorityName>
      <s:Parameter s:name="translation_table">Standard (1)</s:Parameter>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="fromGenericSequenceCollectionToFASTA">
    <s:description>Converts a collection of generic sequences into FASTA sequences</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>fromGenericSequenceCollectionToFASTA</s:serviceName>
      <s:authorityName>genome.imim.es</s:authorityName>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="searchInterPro" boring="true">
    <s:description>Query an Amino Acid sequence against InterPro.</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>searchInterPro</s:serviceName>
      <s:authorityName>inb.bsc.es</s:authorityName>
      <s:Parameter s:name="hmmsmart">no</s:Parameter>
      <s:Parameter s:name="tmhmm">yes</s:Parameter>
      <s:Parameter s:name="seg">yes</s:Parameter>
      <s:Parameter s:name="fprintscan">no</s:Parameter>
      <s:Parameter s:name="hmmpir">no</s:Parameter>
      <s:Parameter s:name="superfamily">no</s:Parameter>
      <s:Parameter s:name="coils">yes</s:Parameter>
      <s:Parameter s:name="gene3d">no</s:Parameter>
      <s:Parameter s:name="scanregexp">no</s:Parameter>
      <s:Parameter s:name="blastprodom">no</s:Parameter>
      <s:Parameter s:name="hmmpfam">no</s:Parameter>
      <s:Parameter s:name="signalp">yes</s:Parameter>
      <s:Parameter s:name="hmmpanther">no</s:Parameter>
      <s:Parameter s:name="profilescan">no</s:Parameter>
      <s:Parameter s:name="hmmtigr">no</s:Parameter>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="runHMMPfam">
    <s:description>Searches a HMM profile database (Pfam) with a query sequence. Use this if you are trying to annotate an unknown sequence.</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>runHMMPfam</s:serviceName>
      <s:authorityName>inb.bsc.es</s:authorityName>
      <s:Parameter s:name="hmm_accessions">on</s:Parameter>
      <s:Parameter s:name="e-value_domain" />
      <s:Parameter s:name="alignment_number">10</s:Parameter>
      <s:Parameter s:name="score_cutoff" />
      <s:Parameter s:name="e-value_score">59021</s:Parameter>
      <s:Parameter s:name="score_cutoff_domain" />
      <s:Parameter s:name="e-value">10.0</s:Parameter>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="fromFASTAToDNASequence">
    <s:description>Converts a DNA FASTA sequence into a DNA sequence</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>fromFASTAToDNASequence</s:serviceName>
      <s:authorityName>genome.imim.es</s:authorityName>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="runGeneIDGFF">
    <s:description>Ab initio gene prediction tool that returns the gene predictions in GFF format (GFF version 2).</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>runGeneIDGFF</s:serviceName>
      <s:authorityName>genome.imim.es</s:authorityName>
      <s:Parameter s:name="strand">Both</s:Parameter>
      <s:Parameter s:name="profile">Homo sapiens (suitable for mammals)</s:Parameter>
      <s:Parameter s:name="engine">Normal</s:Parameter>
      <s:Parameter s:name="signals">None</s:Parameter>
      <s:Parameter s:name="exons">None</s:Parameter>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="runGFF2JPEG">
    <s:description>Runs gff2ps software to vizualize a set of GFF annotations maps. It returns an encoded image in JPEG format.</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>runGFF2JPEG</s:serviceName>
      <s:authorityName>genome.imim.es</s:authorityName>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="Parse_Moby_Data_Pepstats_Text">
    <s:description>Processor to parse the datatype Pepstats_Text</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>Pepstats_Text</s:datatype>
      <s:articleName>pepstats_report</s:articleName>
      <s:description>Processor to parse the datatype Pepstats_Text</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:processor name="runNCBIBlastp">
    <s:description>Compares a protein sequence against a protein database and calculates the statistical significance of matches using the Basic Local Alignment Tool (BLAST).</s:description>
    <s:biomobywsdl>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>runNCBIBlastp</s:serviceName>
      <s:authorityName>inb.bsc.es</s:authorityName>
      <s:Parameter s:name="database">Swiss-Prot</s:Parameter>
      <s:Parameter s:name="gapalign">true</s:Parameter>
      <s:Parameter s:name="opengap">11</s:Parameter>
      <s:Parameter s:name="matrix">BLOSUM62</s:Parameter>
      <s:Parameter s:name="alignments">15</s:Parameter>
      <s:Parameter s:name="extendgap">2</s:Parameter>
      <s:Parameter s:name="filter">true</s:Parameter>
      <s:Parameter s:name="expected_threshold">0.00001</s:Parameter>
      <s:Parameter s:name="dropoff">0</s:Parameter>
      <s:Parameter s:name="scores">25</s:Parameter>
    </s:biomobywsdl>
  </s:processor>
  <s:processor name="Parse_Moby_Data_GFF">
    <s:description>Processor to parse the datatype GFF</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>GFF</s:datatype>
      <s:articleName>geneid_predictions</s:articleName>
      <s:description>Processor to parse the datatype GFF</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:processor name="String">
    <s:description>a string</s:description>
    <s:biomobyobject>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>String</s:serviceName>
      <s:authorityName />
    </s:biomobyobject>
  </s:processor>
  <s:processor name="Parse_Moby_Data_b64_encoded_jpeg">
    <s:description>Processor to parse the datatype b64_encoded_jpeg</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>b64_encoded_jpeg</s:datatype>
      <s:articleName>image</s:articleName>
      <s:description>Processor to parse the datatype b64_encoded_jpeg</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:processor name="FastaSequencObject">
    <s:description>NA sequence in FASTA format</s:description>
    <s:biomobyobject>
      <s:mobyEndpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:mobyEndpoint>
      <s:serviceName>FASTA_NA</s:serviceName>
      <s:authorityName />
    </s:biomobyobject>
  </s:processor>
  <s:processor name="Parse_Moby_Data_BLAST_Text">
    <s:description>Processor to parse the datatype BLAST-Text</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>BLAST-Text</s:datatype>
      <s:articleName>blast_report</s:articleName>
      <s:description>Processor to parse the datatype BLAST-Text</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:processor name="Parse_Moby_Data_FASTA">
    <s:description>Processor to parse the datatype FASTA</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>FASTA</s:datatype>
      <s:articleName>sequences</s:articleName>
      <s:description>Processor to parse the datatype FASTA</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:processor name="Parse_Moby_Data_HMMPfam_Report">
    <s:description>Processor to parse the datatype HMMPfam_Report</s:description>
    <s:biomobyparser>
      <s:endpoint>http://moby.ucalgary.ca/moby/MOBY-Central.pl</s:endpoint>
      <s:datatype>HMMPfam_Report</s:datatype>
      <s:articleName>hmmpfam_report</s:articleName>
      <s:description>Processor to parse the datatype HMMPfam_Report</s:description>
    </s:biomobyparser>
  </s:processor>
  <s:link source="Decode_base64_to_byte:bytes" sink="gff_map" />
  <s:link source="FastaSequencObject:mobyData" sink="fromFASTAToDNASequence:FASTA_NA(sequence)" />
  <s:link source="Parse_Moby_Data_BLAST_Text:blast_report_'content'" sink="blastp_report" />
  <s:link source="Parse_Moby_Data_b64_encoded_jpeg:image_'content'" sink="Decode_base64_to_byte:base64" />
  <s:link source="String:mobyData" sink="FastaSequencObject:String(content)" />
  <s:link source="fasta_sequence" sink="String:value" />
  <s:link source="identifier" sink="FastaSequencObject:id" />
  <s:link source="namespace" sink="FastaSequencObject:namespace" />
  <s:link source="StringArticleName:value" sink="String:article name" />
  <s:link source="fromFASTAToDNASequence:DNASequence(sequence)" sink="runGeneIDGFF:DNASequence(sequence)" />
  <s:link source="fromFASTAToDNASequence:DNASequence(sequence)" sink="translateGeneIDGFFPredictions:DNASequence(sequence)" />
  <s:link source="fromGenericSequenceCollectionToFASTA:FASTA(sequences)" sink="Parse_Moby_Data_FASTA:mobyData('FASTA')" />
  <s:link source="runEmbossPepstatsFromSequence:Pepstats_Text(pepstats_report)" sink="Parse_Moby_Data_Pepstats_Text:mobyData('Pepstats_Text')" />
  <s:link source="runGFF2JPEG:b64_encoded_jpeg(image)" sink="Parse_Moby_Data_b64_encoded_jpeg:mobyData('b64_encoded_jpeg')" />
  <s:link source="runGeneIDGFF:GFF(geneid_predictions)" sink="Parse_Moby_Data_GFF:mobyData('GFF')" />
  <s:link source="runGeneIDGFF:GFF(geneid_predictions)" sink="runGFF2JPEG:GFF(Collection - 'maps')" />
  <s:link source="runGeneIDGFF:GFF(geneid_predictions)" sink="translateGeneIDGFFPredictions:GFF(geneid_predictions)" />
  <s:link source="runHMMPfam:HMMPfam_Report(hmmpfam_report)" sink="Parse_Moby_Data_HMMPfam_Report:mobyData('HMMPfam_Report')" />
  <s:link source="runNCBIBlastp:BLAST-Text(blast_report)" sink="Parse_Moby_Data_BLAST_Text:mobyData('BLAST-Text')" />
  <s:link source="translateGeneIDGFFPredictions:AminoAcidSequence(Collection - 'peptides' As Simples)" sink="runEmbossPepstatsFromSequence:AminoAcidSequence(sequence)" />
  <s:link source="translateGeneIDGFFPredictions:AminoAcidSequence(Collection - 'peptides' As Simples)" sink="runHMMPfam:AminoAcidSequence(sequence)" />
  <s:link source="translateGeneIDGFFPredictions:AminoAcidSequence(Collection - 'peptides' As Simples)" sink="runNCBIBlastp:AminoAcidSequence(sequence)" />
  <s:link source="translateGeneIDGFFPredictions:AminoAcidSequence(Collection - 'peptides' As Simples)" sink="searchInterPro:AminoAcidSequence(sequence)" />
  <s:link source="translateGeneIDGFFPredictions:AminoAcidSequence(Collection - 'peptides')" sink="fromGenericSequenceCollectionToFASTA:GenericSequence(Collection - 'sequences')" />
  <s:link source="Parse_Moby_Data_FASTA:sequences_'content'" sink="peptide_sequences" />
  <s:link source="Parse_Moby_Data_GFF:geneid_predictions_'content'" sink="geneid_gff_predictions" />
  <s:link source="Parse_Moby_Data_HMMPfam_Report:hmmpfam_report_'Alignments'_'content'" sink="motif_alignments" />
  <s:link source="Parse_Moby_Data_HMMPfam_Report:hmmpfam_report_'Sequences'" sink="pfam_report" />
  <s:link source="Parse_Moby_Data_Pepstats_Text:pepstats_report_'content'" sink="pepStats" />
  <s:link source="searchInterPro:InterProMotifAnnotatedAASequence(iprscan_report)" sink="interproscan_report_debugging" />
  <s:source name="identifier" />
  <s:source name="namespace" />
  <s:source name="fasta_sequence" />
  <s:sink name="peptide_sequences" />
  <s:sink name="gff_map">
    <s:metadata>
      <s:mimeTypes>
        <s:mimeType>image/*</s:mimeType>
      </s:mimeTypes>
    </s:metadata>
  </s:sink>
  <s:sink name="geneid_gff_predictions" />
  <s:sink name="pepStats" />
  <s:sink name="blastp_report" />
  <s:sink name="interproscan_report_debugging" />
  <s:sink name="pfam_report" />
  <s:sink name="motif_alignments" />
</s:scufl>

