diff --git a/docs/quantification/transcriptome/EXPv1.xml b/docs/quantification/transcriptome/EXPv1.xml
new file mode 100644
index 0000000..a18b242
--- /dev/null
+++ b/docs/quantification/transcriptome/EXPv1.xml
@@ -0,0 +1,146 @@
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/css" href="http://deep.mpi-inf.mpg.de/DAC/files/style/deep_process_style.css"?>
+<process>
+    <name>EXP</name>
+	<version>1</version>
+	<author>
+		<name>Matthias Barann</name>
+		<email>m.barann@ikmb.uni-kiel.de</email>
+	</author>
+    <description>
+		* bam2wig.py: Conversion of BAM file to BigWig coverage tracks. One track per strand will be generated.
+		* htseq-count: Generates read counts on the gene level.
+		* cufflinks: Generates FPKM values for genes and transcript isoforms.
+	</description>
+	<inputs>
+		<filetype>
+			<identifier>.bam</identifier>
+			<format></format>
+			<quantity>single</quantity>
+			<comment>Unfiltered aligned reads</comment>
+		</filetype>
+		<filetype>
+			<identifier>.bai</identifier>
+			<format></format>
+			<quantity>single</quantity>
+			<comment>Index file to bam file</comment>
+		</filetype>
+	</inputs>
+	<references>
+		<filetype>
+			<identifier>chromInfo.txt</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>Tab delimited file containing the name and length of the reference sequences: [name][tab][length].</comment>
+		</filetype>
+		<filetype>
+			<identifier>gencode.v19.annotation.gtf</identifier>
+			<format>GTF</format>
+			<quantity>single</quantity>
+			<comment>Gencode gene annotation file in gene transfer format.</comment>
+		</filetype>
+		<filetype>
+			<identifier>reference.fa</identifier>
+			<format>multi fasta</format>
+			<quantity>single</quantity>
+			<comment>The reference genome file; see aspera.dkfz.de > download > results > references > genomes > human > WholeGenome</comment>
+		</filetype>
+	</references>
+	<outputs>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].bamcov.Forward.wig</identifier>
+			<format>wiggle</format>
+			<quantity>single</quantity>
+			<comment>Forward strand wiggle file. Usually it is not necessary to keep this file.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].bamcov.Reverse.wig</identifier>
+			<format>wiggle</format>
+			<quantity>single</quantity>
+			<comment>Reverse strand wiggle file. Usually it is not necessary to keep this file.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].bamcov.Forward.bw</identifier>
+			<format>BigWig</format>
+			<quantity>single</quantity>
+			<comment>Forward strand BigWig file. This file will only be generated if the UCSC program wigToBigWig can be found in $PATH.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].bamcov.Reverse.bw</identifier>
+			<format>BigWig</format>
+			<quantity>single</quantity>
+			<comment>Reverse strand BigWig file. This file will only be generated if the UCSC program wigToBigWig can be found in $PATH.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].readcounts.txt</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>This file contains the read counts on the gene level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].genes.fpkm.tracking</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>Output file containing the FPKM counts on the gene level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].isoforms.fpkm.tracking</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>Output file containing the FPKM counts on the isoform level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].EXPv1.[DATE].transcripts.gtf</identifier>
+			<format>gene transfer format</format>
+			<quantity>single</quantity>
+			<comment>This file contains assembled transcripts.</comment>
+		</filetype>
+	</outputs>
+	<software>
+		<tool>
+			<name>Python</name>
+			<version>2.7</version>
+			<command_line><![CDATA[ CMDLINE ]]></command_line>
+			<loop>no looping</loop>
+			<comment></comment>
+		</tool>
+		<tool>
+			<name>Samtools</name>
+			<version>0.1.19-44428cd</version>
+			<command_line><![CDATA[ CMDLINE ]]></command_line>
+			<loop>no looping</loop>
+			<comment></comment>
+		</tool>
+		<tool>
+			<name>bam2wig.py</name>
+			<version>2.3.9</version>		
+			<command_line><![CDATA[ python bam2wig.py -i ${_sample}.bam -s chromInfo.txt -o ${_sample} -d "1+-,1-+,2++,2--" ]]></command_line>
+            <loop>no looping</loop>
+			<comment>The python script is part of the RSeQC software. It will convert a bam file into two wig files (one for each strand). \
+			If the UCSC program wigToBigWig can be located by the python script, the generated wig files will automatically be converted to bigWig. \
+			Please note that for some samples the wigToBigWig command might exit with errors. In this case, manually invoking the wigToBigWig \
+			command on the generated wig files can solve the problem: \
+			wigToBigWig ${_sample}_Forward.wig chromInfo.txt ${_sample}_Forward.bw</comment>
+		</tool>
+		<tool>
+			<name>htseq-count</name>
+			<version>0.5.4p3</version>		
+			<command_line><![CDATA[ samtools sort -n -@ 8 -m 4G ${_sample}.bam ${_sample}_sorted
+			samtools/samtools view -F 256 ${_sample}_sorted.bam > ${_sample}.sam
+			htseq-count -s reverse  -m intersection-strict -a 20 ${_sample}.sam gencode.v19.annotation.gtf > ${_sample}_htseq.txt ]]>
+			</command_line>
+            <loop>no looping</loop>
+			<comment>htseq-count requires bam files sorted by read name (step 1). After sorting, all non-primary alignments are removed during the bam to sam conversion. \
+			Invoking htseq-count counts the number of reads per gene. Using the mode 'intersection-strict' results in a rather conservative read count. \
+			Please see http://www-huber.embl.de/users/anders/HTSeq/doc/count.html#count for further information.</comment>
+		</tool>
+		<tool>
+			<name>cufflinks</name>
+			<version>v2.0.2</version>		
+			<command_line><![CDATA[ cufflinks -p 8 --frag-bias-correct reference.fa --multi-read-correct --library-type fr-firststrand --compatible-hits-norm -G gencode.v19.annotation_transcripts_only.gtf ${_sample}.bam ]]>
+			</command_line>
+            <loop>no looping</loop>
+			<comment>Please see http://cufflinks.cbcb.umd.edu/manual.html for further information.</comment>
+		</tool>
+	</software>
+</process>	
diff --git a/docs/quantification/transcriptome/LXPv1.xml b/docs/quantification/transcriptome/LXPv1.xml
new file mode 100644
index 0000000..5177b5f
--- /dev/null
+++ b/docs/quantification/transcriptome/LXPv1.xml
@@ -0,0 +1,135 @@
+<?xml version="1.0"?>
+<process>
+	<name>LXP</name>
+	<version>1</version>
+	<author>
+		<name>Anupam Sinha</name>
+		<email>a.sinha@ikmb.uni-kiel.de</email>
+	</author>
+	<!-- Precise description of what this process does, what output is generated and what statistics are computed -->
+	<description>
+		* htseq-count: Generates read counts on the gene level.
+		* cufflinks: Generates FPKM values for genes and transcript isoforms.
+		* StringTie: Generates FPKM values for genes and transcript isoforms. Also generates .ctab files for analysis using Ballgown.
+	</description>
+	<!-- Following section: list input files [samples to be analysed and similar] -->
+	<inputs>
+		<filetype>
+			<identifier>.bam</identifier>
+			<format></format>
+			<quantity>single</quantity>
+			<comment>Unfiltered aligned reads</comment>
+		</filetype>
+	</inputs>
+	<!-- Following section: list reference files [e.g. reference genomes] used in this process -->
+	<references>
+		<filetype>
+			<identifier>gencode.v19.annotation.gtf</identifier>
+			<format>GTF</format>
+			<quantity>single</quantity>
+			<comment>Gencode gene annotation file in gene transfer format.</comment>
+		</filetype>
+		<filetype>
+			<identifier>reference.fa</identifier>
+			<format>multi fasta</format>
+			<quantity>single</quantity>
+			<comment>The reference genome file; see aspera.dkfz.de > download > results > references > genomes > human > WholeGenome</comment>
+		</filetype>
+	</references>
+	<!-- Following section: list output files of process [e.g. fpkm files, read counts files from htseq etc.] -->
+	<outputs>
+		<filetype>
+			<identifier>[sampleID].LXPv1.[DATE].readcounts.txt</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>This file contains the read counts on the gene level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].LXPv1.[DATE].genes.fpkm.tracking</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>Output file containing the FPKM counts on the gene level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].LXPv1.[DATE].isoforms.fpkm.tracking</identifier>
+			<format>text file</format>
+			<quantity>single</quantity>
+			<comment>Output file containing the FPKM counts on the isoform level.</comment>
+		</filetype>
+		<filetype>
+			<identifier>[sampleID].LXPv1.[DATE].transcripts.gtf</identifier>
+			<format>gene transfer format</format>
+			<quantity>single</quantity>
+			<comment>This file contains assembled transcripts.</comment>
+		</filetype>
+		<filetype>
+                        <identifier>[sampleID].LXPv1.[DATE].stringtie.gtf</identifier>
+                        <format>gene transfer format</format>
+                        <quantity>single</quantity>
+                        <comment>This file contains assembled transcripts.</comment>
+                </filetype>
+		<filetype>
+                        <identifier>[sampleID].LXPv1.[DATE].ballgown</identifier>
+                        <format>tab separated fields (.ctab) format</format>
+                        <quantity>five</quantity>
+                        <comment>This is a folder containing 5 .ctab files. These .ctab files contain the expression values of exons, introns and transcripts. Two files list the internal (generated by ballgown) association ids between exons, introns, and transcripts.</comment>
+                </filetype>
+	</outputs>
+
+	<software>
+		<tool>
+			<name>Python</name>
+			<version>2.7</version>
+			<command_line><![CDATA[ CMDLINE ]]></command_line>
+			<loop>no looping</loop>
+			<comment></comment>
+		</tool>
+		<tool>
+			<name>Samtools</name>
+			<version>0.1.19-44428cd</version>
+			<command_line><![CDATA[ CMDLINE ]]></command_line>
+			<loop>no looping</loop>
+			<comment></comment>
+		</tool>
+		<tool>
+			<name>htseq-count</name>
+			<version>0.6.1p1</version>		
+			<command_line>samtools sort -n -@ 8 -m 4G ${_sample}.bam ${_sample}_sorted
+			samtools/samtools view -F 256 ${_sample}_sorted.bam > ${_sample}.sam
+			htseq-count -s reverse -m union -a 20 ${_sample}.sam gencode.v19.annotation.gtf > ${_sample}_htseq.txt
+			</command_line>
+			<loop>no looping</loop>
+			<comment>htseq-count requires bam files sorted by read name (step 1). After sorting, all non-primary alignments are removed during the bam to sam conversion. \
+			Invoking htseq-count counts the number of reads per gene.  \
+			Please see http://www-huber.embl.de/users/anders/HTSeq/doc/count.html#count for further information.
+			</comment>
+		</tool>
+		<tool>
+			<name>cufflinks</name>
+			<version>v2.0.2</version>		
+			<command_line>
+				<![CDATA[
+					cufflinks -p 16 --frag-bias-correct reference.fa --multi-read-correct --library-type fr-firststrand
+					--compatible-hits-norm -G gencode.v19.annotation_transcripts_only.gtf ${_sample}.bam
+				]]>
+			</command_line>
+			<loop>no looping</loop>
+			<comment>Please see http://cufflinks.cbcb.umd.edu/manual.html for further information.</comment>
+		</tool>
+		<tool>
+			<name>StringTie</name>
+			<version>v1.0.3</version>
+			<command_line>
+				<![CDATA[
+					stringtie ${_sample}.bam -p 16 -e -b ${_sample}.ballgown -o ${_sample}_stringtie.gtf -G gencode.v19.annotation_transcripts_only.gtf
+				]]>
+            </command_line>
+			<loop>no looping</loop>
+			<comment>Please see http://ccb.jhu.edu/software/stringtie/ for further information. \
+			"-b" option creates a folder which contains the .ctab files for analysis using Ballgown. \
+			Please see https://github.com/alyssafrazee/ballgown for further information.
+			</comment>
+		</tool>
+
+	</software>
+</process>	
diff --git a/docs/quantification/transcriptome/SXPv1.xml b/docs/quantification/transcriptome/SXPv1.xml
new file mode 100644
index 0000000..589091e
--- /dev/null
+++ b/docs/quantification/transcriptome/SXPv1.xml
@@ -0,0 +1,207 @@
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/css" href="http://deep.mpi-inf.mpg.de/DAC/files/style/deep_process_style.css"?>
+<process>
+    <name>SXP</name>
+	<version>1</version>
+	<author>
+		<name>Filippos Klironomos</name>
+		<email>filippos.klironomos@mdc-berlin.de</email>
+	</author>
+	<description>
+    *) miRDeep2 pipeline involves:
+      *) mapping of reads to genome and keeping those uniquely mapped
+      *) extracting bracketing DNA of the uniquely mapped reads
+      *) RNAfold extracted sequences and keeping those that form unbifurcated hairpins
+      *) scoring putative precursors:
+         *) expect greater number of reads mapping to either the -5p or -3p strand and very little to the hairpin
+         *) short 3&apos; duplex overhang characteristic of Drosha/Dicer processing adds to the score
+         *) relative and absolute stabilities contribute to the score
+         *) if 5&apos; end of mature sequence is identical to that of known mature sequence it adds to the score
+      *) randomly permuting read signatures with putative precursor sequences in order to determine the FPR
+    Internally miRDeep2 uses the following packages:
+    RNAfold version 2.1.7
+    RANDFOLD version 2
+	</description>
+	<inputs>
+		<filetype>
+      <identifier>config</identifier>
+			<format>TSV</format>
+      <quantity>single</quantity>
+      <comment>
+        this is the configuration file that miRDeep2 uses to locate the FASTQ library and assign the 3-character identification to it
+      </comment>
+		</filetype>
+	</inputs>
+	<references>
+		<filetype>
+			<identifier>genome</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+      <comment>
+        hs37d5 and GRCm38mm10 genomes are modified as follows:
+          *) IDs are simplified, everything to the right of the first white space encountered is removed,
+          *) all ambiguously called nucleotides [URYSWKMBDHV] have been masked to &quot;N&quot;.
+        The following script does all this:
+        <![CDATA[
+          sed -e 's/^>\(\S\+\)\s.*$/>\1/' -e '/^[^>]/s/[UuRrYySsWwKkMmBbDdHhVv]/N/g' hs37d5.fa > hs37d5_simple.fa
+          sed -e 's/^>\(\S\+\)\s.*$/>\1/' -e '/^[^>]/s/[UuRrYySsWwKkMmBbDdHhVv]/N/g' GRCm38mm10.fa > GRCm38mm10_simple.fa
+        ]]>
+      </comment>
+		</filetype>
+		<filetype>
+			<identifier>genome_index</identifier>
+			<format>bowtie-index</format>
+			<quantity>collection</quantity>
+      <comment>
+  	    bowtie version 0.12.7 index of hs37d5_simple.fa and GRCm38mm10_simple.fa generated as follows:
+          bowtie-build -f hs37d5_simple.fa hs37d5_simple.fa
+          bowtie-build -f GRCm38mm10_simple.fa GRCm38mm10_simple.fa
+      </comment>
+		</filetype>
+		<filetype>
+			<identifier>miRBase_mature</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+			<comment>mature known miRNA reference from miRBase Release 20 uploaded to ASPERA</comment>
+		</filetype>
+		<filetype>
+			<identifier>miRBase_hairpin</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+			<comment>precursor (hairpin) known miRNA reference from miRBase Release 20 uploaded to ASPERA</comment>
+		</filetype>
+	</references>
+	<outputs>
+		<filetype>
+      <identifier>SampleID.SXPv1.DATE.known.csv</identifier>
+			<format>csv</format>
+			<quantity>single</quantity>
+      <comment>
+        expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv1.DATE.known.bed</identifier>
+			<format>bed</format>
+			<quantity>single</quantity>
+      <comment>
+        BED track of expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv1.DATE.known.bedGraph</identifier>
+			<format>bedGraph</format>
+			<quantity>single</quantity>
+      <comment>
+        bedGraph track of expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv1.DATE.novel.bed</identifier>
+			<format>bed</format>
+			<quantity>single</quantity>
+      <comment>
+        BED track of expression of novel miRNAs predicted by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv1.DATE.novel.bedGraph</identifier>
+			<format>bedGraph</format>
+			<quantity>single</quantity>
+      <comment>
+        bedGraph track of expression of novel miRNAs predicted by miRDeep2
+      </comment>
+		</filetype>
+	</outputs>
+	<software>
+		<tool>
+            <name>generate_config</name>
+			<version>missing</version>
+            <command_line>
+            <![CDATA[ echo -ne "{SampleID.fastq}\tID1\n" > config ]]>
+            </command_line>
+            <loop>no looping</loop>
+            <comment>
+            this command creates the configuration file for miRDeep2 to use in order to locate the FASTQ library {SampleID.fastq} and assign
+            a 3-character internal ID to it, in this case ID1
+            </comment>
+		</tool>
+		<tool>
+		    <name>mapper.pl</name>
+			<version>miRDeep2.0.0.6</version>
+            <command_line>
+            <![CDATA[ mapper.pl config -d -e -h -j -k {Adaptor} -l 18 -m -p {genome_index} -s reads_collapsed.fa -t reads_vs_genome.arf -v -o 12  &> mapper_summary.log ]]>
+            </command_line>
+            <loop>no looping</loop>
+            <comment>
+                use the configuration file to locate the library; remove adaptor provided by {Adaptor};
+                collapse the reads to the file &quot;reads_collapsed.fa&quot;;
+                map to the reference and output the alignments in the file &quot;reads_vs_genome.arf&quot;;
+                print out summary in &quot;mapper_summary.log&quot;
+
+                The ARF is a text-based format consisting of the following columns:
+
+                  readID  #  the ID of the read
+                  readLength  #  length of the read
+                  start  #  start position of the alignment relative to the read
+                  end  #  end position of the alignment relative to the read
+                  readSeq  #  sequence of the read
+                  chr  #  chromosome of reference where read maps
+                  refLength  #  length of the reference sequence where read maps to
+                  start  #  start position of reference sequence where read maps to
+                  end  #  end position of reference sequence where read maps to
+                  referenceSeq  #  reference sequence where read maps to
+                  strand  #  strand of reference
+                  mm  #  number of mismatches in the alignment
+                  MAPQ-like-string  #  m==perfect match, M==mismatch
+            </comment>
+		</tool>
+		<tool>
+		    <name>miRDeep2</name>
+			<version>miRDeep2.0.0.6</version>
+            <command_line>
+            <![CDATA[ miRDeep2.pl reads_collapsed.fa {genome} reads_vs_genome.arf {miRBase_mature} none {miRBase_hairpin} -t {Species} -P 2> miRDeep2.report.log ]]>
+            </command_line>
+            <loop>no looping</loop>
+            <comment>quantify known miRNAs and predict putative novel miRNAs across samples</comment>
+		</tool>
+		<tool>
+			<name>rename_according_to_metadata_standards</name>
+			<version>missing</version>
+            <command_line>
+            <![CDATA[ cp miRNAs_expressed_all_samples_DATE_t_TIME.csv {SampleID}.SXPv1.{DATE}.known.csv ]]>
+            </command_line>
+            <loop>no looping</loop>
+			<comment>rename output data file to conform to metadata naming standards</comment>
+		</tool>
+		<tool>
+			<name>mirdeep2_csv2bed.pl</name>
+			<version>missing</version>
+            <command_line>
+            <![CDATA[
+                mirdeep2_csv2bed.pl -r result_DATE_t_TIME.csv -p -T {SampleID}
+                cp known_pres_DATE_t_TIME_score-50_to_na.bed {SampleID}.SXPv1.{DATE}.known.bed
+                echo "track name=\"{SampleID}.novel_miRNAs\" description=\"novel miRNAs detected by miRDeep2 for {SampleID}\" visibility=2 itemRgb=\"On\"" > "{SampleID}.SXPv1.{DATE}.novel.bed"
+                cat "novel_pres_DATE_t_TIME_score-50_to_na.bed" >> "{SampleID}.SXPv1.{DATE}.novel.bed"
+            ]]>
+            </command_line>
+            <loop>no looping</loop>
+            <comment>
+                Generate BED tracks from the total precursor read counts of known and novel miRNAs and rename them according to metadata standards.
+                This tool has been uploaded to ASPERA.
+            </comment>
+		</tool>
+		<tool>
+			<name>bed_to_bedGraph</name>
+			<version>missing</version>
+            <command_line>
+            <![CDATA[
+                gawk 'NR==3 {print "track type=bedGraph description=\"miRDeep2 known miRNAs\" visibility=2 color=0,0,255 altColor=255,0,0" > FILENAME"Graph";  print $1,$2,$3,$5 >> FILENAME"Graph"} NR>3 {print $1,$2,$3,$5 >> FILENAME"Graph"}' "{SampleID}.SXPv1.{DATE}.known.bed"
+                gawk 'NR==1 {print "track type=bedGraph description=\"miRDeep2 novel miRNAs\" visibility=2 color=0,0,255 altColor=255,0,0" > FILENAME"Graph";  print $1,$2,$3,$5 >> FILENAME"Graph"} NR>1 {print $1,$2,$3,$5 >> FILENAME"Graph"}' "{SampleID}.SXPv1.{DATE}.novel.bed"
+            ]]>
+            </command_line>
+            <loop>no looping</loop>
+			<comment>convert BED tracks to bedGraph</comment>
+		</tool>
+	</software>
+</process>	
diff --git a/docs/quantification/transcriptome/SXPv2.xml b/docs/quantification/transcriptome/SXPv2.xml
new file mode 100644
index 0000000..63ad5f6
--- /dev/null
+++ b/docs/quantification/transcriptome/SXPv2.xml
@@ -0,0 +1,227 @@
+<?xml version="1.0"?>
+<?xml-stylesheet type="text/css" href="http://deep.mpi-inf.mpg.de/DAC/files/style/deep_process_style.css"?>
+<process>
+	<name>SXP</name>
+	<version>2</version>
+	<author>
+		<name>Filippos Klironomos</name>
+		<email>filippos.klironomos@mdc-berlin.de</email>
+	</author>
+    <description>
+    *) miRDeep2 pipeline involves:
+
+      *) mapping of reads to genome and keeping those uniquely mapped
+      *) extracting bracketing DNA of the uniquely mapped reads
+      *) RNAfold extracted sequences and keeping those that form unbifurcated hairpins
+      *) scoring putative precursors:
+         *) expect greater number of reads mapping to either the -5p or -3p strand and very little to the hairpin
+         *) short 3&apos; duplex overhang characteristic of Drosha/Dicer processing adds to the score
+         *) relative and absolute stabilities contribute to the score
+         *) if 5&apos; end of mature sequence is identical to that of known mature sequence it adds to the score
+      *) randomly permuting read signatures with putative precursor sequences in order to determine the FPR
+
+    Internally miRDeep2 uses the following packages:
+
+    RNAfold version 2.1.7
+    RANDFOLD version 2
+	</description>
+	<inputs>
+		<filetype>
+      <identifier>config</identifier>
+			<format>TSV</format>
+      <quantity>single</quantity>
+      <comment>
+        this is the configuration file that miRDeep2 uses to locate the FASTQ library and assign the 3-character identification to it
+      </comment>
+		</filetype>
+	</inputs>
+	<!-- Following section: list reference files [e.g. reference genomes] used in this process -->
+	<references>
+		<filetype>
+			<identifier>genome</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+      <comment>
+<![CDATA[
+        hs37d5 and GRCm38mm10 genomes are modified as follows:
+
+          *) IDs are simplified, everything to the right of the first white space encountered is removed,
+
+          *) all ambiguously called nucleotides [URYSWKMBDHV] have been masked to 'N'.
+
+        The following script does all this:
+        
+          sed -e 's/^>\(\S\+\)\s.*$/>\1/' -e '/^[^>]/s/[UuRrYySsWwKkMmBbDdHhVv]/N/g' hs37d5.fa > hs37d5_simple.fa
+          sed -e 's/^>\(\S\+\)\s.*$/>\1/' -e '/^[^>]/s/[UuRrYySsWwKkMmBbDdHhVv]/N/g' GRCm38mm10.fa > GRCm38mm10_simple.fa
+]]>
+      </comment>
+		</filetype>
+		<filetype>
+			<identifier>genome_index</identifier>
+			<format>bowtie-index</format>
+			<quantity>collection</quantity>
+      <comment>
+  	    bowtie version 1.1.1 index of hs37d5_simple.fa and GRCm38mm10_simple.fa generated as follows:
+
+          bowtie-build -f hs37d5_simple.fa hs37d5_simple.fa
+          bowtie-build -f GRCm38mm10_simple.fa GRCm38mm10_simple.fa
+      </comment>
+		</filetype>
+		<filetype>
+			<identifier>miRBase_mature</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+			<comment>mature known miRNA reference from miRBase Release 20 uploaded to ASPERA</comment>
+		</filetype>
+		<filetype>
+			<identifier>miRBase_hairpin</identifier>
+			<format>fasta</format>
+			<quantity>single</quantity>
+			<comment>precursor (hairpin) known miRNA reference from miRBase Release 20 uploaded to ASPERA</comment>
+		</filetype>
+	</references>
+	<!-- Following section: list output files of process [e.g. bed files, wiggle tracks] -->
+	<outputs>
+		<filetype>
+      <identifier>SampleID.SXPv2.DATE.known.csv</identifier>
+			<format>csv</format>
+			<quantity>single</quantity>
+      <comment>
+        expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv2.DATE.known.bed</identifier>
+			<format>bed</format>
+			<quantity>single</quantity>
+      <comment>
+        BED track of expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv2.DATE.known.bedGraph</identifier>
+			<format>bedGraph</format>
+			<quantity>single</quantity>
+      <comment>
+        bedGraph track of expression of known miRNAs quantified by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv2.DATE.novel.bed</identifier>
+			<format>bed</format>
+			<quantity>single</quantity>
+      <comment>
+        BED track of expression of novel miRNAs predicted by miRDeep2
+      </comment>
+		</filetype>
+		<filetype>
+      <identifier>SampleID.SXPv2.DATE.novel.bedGraph</identifier>
+			<format>bedGraph</format>
+			<quantity>single</quantity>
+      <comment>
+        bedGraph track of expression of novel miRNAs predicted by miRDeep2
+      </comment>
+		</filetype>
+	</outputs>
+	<!-- Following section: list software tools and command lines used in this process -->
+
+	<software>
+		<tool>
+      <name>generate_config</name>
+			<version>missing</version>
+      <command_line>
+            <![CDATA[
+                echo -ne "{SampleID.fastq}\tID1\n" > config
+            ]]>
+      </command_line>
+      <loop>no looping</loop>
+      <comment>
+        this command creates the configuration file for miRDeep2 to use in order to locate the FASTQ library {SampleID.fastq} and assign
+        a 3-character internal ID to it, in this case ID1
+      </comment>
+		</tool>
+		<tool>
+			<name>mapper.pl</name>
+			<version>miRDeep2.0.0.7</version>
+      <command_line>
+        <![CDATA[
+            mapper.pl config -d -e -h -j -k {Adaptor} -l 18 -m -p {genome_index} -s reads_collapsed.fa -t reads_vs_genome.arf -v -o 12  &> mapper_summary.log
+        ]]>
+      </command_line>
+      <loop>no looping</loop>
+      <comment>
+        use the configuration file to locate the library; remove adaptor provided by {Adaptor}; 
+        collapse the reads to the file "reads_collapsed.fa";
+        map to the reference and output the alignments in the file "reads_vs_genome.arf";
+        print out summary in "mapper_summary.log"
+
+        The ARF is a text-based format consisting of the following columns:
+
+          readID  #  the ID of the read 
+          readLength  #  length of the read
+          start  #  start position of the alignment relative to the read
+          end  #  end position of the alignment relative to the read
+          readSeq  #  sequence of the read
+          chr  #  chromosome of reference where read maps
+          refLength  #  length of the reference sequence where read maps to
+          start  #  start position of reference sequence where read maps to 
+          end  #  end position of reference sequence where read maps to 
+          referenceSeq  #  reference sequence where read maps to 
+          strand  #  strand of reference
+          mm  #  number of mismatches in the alignment
+          MAPQ-like-string  #  m==perfect match, M==mismatch
+      </comment>
+		</tool>
+		<tool>
+			<name>miRDeep2</name>
+			<version>miRDeep2.0.0.7</version>
+      <command_line>
+<![CDATA[
+        miRDeep2.pl reads_collapsed.fa {genome} reads_vs_genome.arf {miRBase_mature} none {miRBase_hairpin} -t {Species} -P -d -v 2> miRDeep2.report.log
+]]>
+      </command_line>
+      <loop>no looping</loop>
+			<comment>quantify known miRNAs and predict putative novel miRNAs across samples</comment>
+		</tool>
+		<tool>
+			<name>rename_according_to_metadata_standards</name>
+			<version>missing</version>
+      <command_line>
+<![CDATA[
+        cp miRNAs_expressed_all_samples_DATE_t_TIME.csv {SampleID}.SXPv2.{DATE}.known.csv
+]]>
+      </command_line>
+      <loop>no looping</loop>
+      <comment>rename output data file to conform to metadata naming standards</comment>
+		</tool>
+		<tool>
+			<name>mirdeep2_csv2bed.pl</name>
+			<version>missing</version>
+      <command_line>
+<![CDATA[
+        mirdeep2_csv2bed.pl -r result_DATE_t_TIME.csv -p -T {SampleID} 
+        cp known_pres_DATE_t_TIME_score-50_to_na.bed {SampleID}.SXPv2.{DATE}.known.bed
+        echo "track name=\"{SampleID}.novel_miRNAs\" description=\"novel miRNAs detected by miRDeep2 for {SampleID}\" visibility=2 itemRgb=\"On\"" > "{SampleID}.SXPv2.{DATE}.novel.bed"
+        cat "novel_pres_DATE_t_TIME_score-50_to_na.bed" >> "{SampleID}.SXPv2.{DATE}.novel.bed"
+]]>
+      </command_line>
+      <loop>no looping</loop>
+      <comment>
+        Generate BED tracks from the total precursor read counts of known and novel miRNAs and rename them according to metadata standards.
+        This tool has been uploaded to ASPERA.
+      </comment>
+		</tool>
+		<tool>
+			<name>bed_to_bedGraph</name>
+			<version>missing</version>
+      <command_line>
+<![CDATA[
+        gawk 'NR==3 {print "track type=bedGraph description=\"miRDeep2 known miRNAs\" visibility=2 color=0,0,255 altColor=255,0,0" > FILENAME"Graph";  print $1,$2,$3,$5 >> FILENAME"Graph"} NR>3 {print $1,$2,$3,$5 >> FILENAME"Graph"}' "{SampleID}.SXPv2.{DATE}.known.bed"
+        gawk 'NR==1 {print "track type=bedGraph description=\"miRDeep2 novel miRNAs\" visibility=2 color=0,0,255 altColor=255,0,0" > FILENAME"Graph";  print $1,$2,$3,$5 >> FILENAME"Graph"} NR>1 {print $1,$2,$3,$5 >> FILENAME"Graph"}' "{SampleID}.SXPv2.{DATE}.novel.bed"
+]]>
+      </command_line>
+      <loop>no looping</loop>
+			<comment>convert BED tracks to bedGraph</comment>
+		</tool>
+	</software>
+</process>