galaxyproject · bernt-matthias · Feb 17, 2023 · Jan 16, 2023 · Jan 16, 2023 · Jan 17, 2023
diff --git a/tools/rgrnastar/macros.xml b/tools/rgrnastar/macros.xml
@@ -5,7 +5,7 @@
     the index versions in sync, but you should manually adjust the +galaxy
     version number. -->
 <tool id="rna_star_index_builder_data_manager" name="rnastar index versioned" tool_type="manage_data" version="@IDX_VERSION@" profile="19.05"> 
 <tool id="rna_star_index_builder_data_manager" name="rnastar index versioned" tool_type="manage_data" version="@IDX_VERSION@" profile="19.05"> 
     <!-- STAR version to be used -->
-    <token name="@VERSION@">2.7.8a</token>
+    <token name="@VERSION@">2.7.10b</token>
     <!-- STAR index version compatible with this version of STAR
     This is the STAR version that introduced the index structure expected
     by the current version.
@@ -19,7 +19,7 @@
     <xml name="requirements">
         <requirements>
             <requirement type="package" version="@VERSION@">star</requirement>
-            <requirement type="package" version="1.9">samtools</requirement>
+            <requirement type="package" version="1.16.1">samtools</requirement>
             <yield />
         </requirements>
     </xml>
@@ -35,7 +35,7 @@
     </xml>
 
     <xml name="index_selection" token_with_gene_model="0">
-        <param argument="--genomeDir" name="genomeDir" type="select"
+        <param argument="--genomeDir" type="select"
         label="Select reference genome"
         help="If your genome of interest is not listed, contact the Galaxy team">
             <options from_data_table="@IDX_DATA_TABLE@">
@@ -81,11 +81,16 @@
     <token name="@TEMPINDEX@"><![CDATA[
     ## Create temporary index for custom reference
     #if str($refGenomeSource.geneSource) == 'history':
+        #if $refGenomeSource.genomeFastaFiles.ext == "fasta"
+            ln -s '$refGenomeSource.genomeFastaFiles' refgenome.fa &&
+        #else
+            gunzip -c '$refGenomeSource.genomeFastaFiles' > refgenome.fa &&
+        #end if
         mkdir -p tempstargenomedir &&
         STAR
             --runMode genomeGenerate
             --genomeDir 'tempstargenomedir'
-            --genomeFastaFiles '${refGenomeSource.genomeFastaFiles}'
+            --genomeFastaFiles refgenome.fa
             ## Handle difference between indices with/without annotations
             #if 'GTFconditional' in $refGenomeSource:
                 ## GTFconditional exists only in STAR, but not STARsolo
@@ -161,8 +166,13 @@
         @FASTQ_GZ_OPTION@
     #end if
     ]]></token>
+    <token name="@LIMITS@" ><![CDATA[
+        --limitOutSJoneRead $algo.params.limits.limitOutSJoneRead
+        --limitOutSJcollapsed $algo.params.limits.limitOutSJcollapsed
+        --limitSjdbInsertNsj $algo.params.limits.limitSjdbInsertNsj
+    ]]></token>
     <xml name="ref_selection">
-        <param argument="--genomeFastaFiles" type="data" format="fasta" label="Select a reference genome" />
+        <param argument="--genomeFastaFiles" type="data" format="fasta,fasta.gz" label="Select a reference genome" />
           <param argument="--genomeSAindexNbases" type="integer" min="2" max="16" value="14" label="Length of the SA pre-indexing string" help="Typically between 10 and 15. Longer strings will use much more memory, but allow faster searches. For small genomes, the parameter --genomeSAindexNbases must be scaled down to min(14, log2(GenomeLength)/2 - 1)"/>
     </xml>
     <xml name="stdio" >
@@ -245,4 +255,21 @@
             <option value="None" >No adapter clipping</option>
         </param>
     </xml>
+    <xml name="common_SAM_attributes">
+        <option value="NH" selected="true">NH (number of reported alignments/hits for the read)</option>
+        <option value="HI" selected="true">HI (query hit index)</option>
+        <option value="AS" selected="true">AS (local alignment score)</option>
+        <option value="nM" selected="true">nM (number of mismatches per (paired) alignment)</option>
+        <option value="NM">NM (edit distance of the aligned read to the reference)</option>
+        <option value="MD">MD (string for mismatching positions)</option>
+        <option value="jM">jM (intron motifs for all junctions)</option>
+        <option value="jI">jI (1-based start and end of introns for all junctions)</option>
+    </xml>
+    <xml name="limits"> <!-- section name must stay "limits": the @LIMITS@ token reads $algo.params.limits.* -->
+        <section name="limits" title="Limits" expanded="false">
+            <param argument="--limitOutSJoneRead" type="integer" min="1" value="1000" label="Maximum number of junctions for one read (including all multimappers)" />
+            <param argument="--limitOutSJcollapsed" type="integer" min="1" value="1000000" label="Maximum number of collapsed junctions" />
+            <param argument="--limitSjdbInsertNsj" type="integer" min="0" value="1000000" label="Maximum number of junctions to be inserted into the genome on the fly." />
+        </section>
+    </xml>
 </macros>
diff --git a/tools/rgrnastar/rg_rnaStar.xml b/tools/rgrnastar/rg_rnaStar.xml
@@ -1,4 +1,4 @@
-<tool id="rna_star" name="RNA STAR" version="@VERSION@+galaxy1" profile="20.01" license="MIT">
+<tool id="rna_star" name="RNA STAR" version="@VERSION@+galaxy0" profile="21.01" license="MIT">
     <description>Gapped-read mapper for RNA-seq data</description>
     <macros>
         <import>macros.xml</import>
@@ -206,9 +210,7 @@
             #end if
 
             ## Limits
-            --limitOutSJoneRead $algo.params.limits.limitOutSJoneRead
-            --limitOutSJcollapsed $algo.params.limits.limitOutSJcollapsed
-            --limitSjdbInsertNsj $algo.params.limits.limitSjdbInsertNsj
+                @LIMITS@
         #else:
             ## Go with STAR's default algorithmic settings,
             ## but we need to provide a reasonable default
@@ -373,16 +375,9 @@
             label="Read alignment tags to include in the BAM output"
             help="Note on using the XS tag: If the XS tag is used, STAR will filter out alignments with undefined strand (i.e., those containing only non-canonical unannotated junctions). Using this tag is recommended if you plan to use the STAR results with STAR-Fusion. In addition, it is required for compatibility
 with Cufflinks if your sequences come from an unstranded library preparation.">
-                <option value="NH" selected="true">NH (number of reported alignments/hits for the read)</option>
-                <option value="HI" selected="true">HI (query hit index)</option>
-                <option value="AS" selected="true">AS (local alignment score)</option>
-                <option value="nM" selected="true">nM (number of mismatches per (paired) alignment)</option>
-                <option value="XS">XS (strand flag, see parameter help below) </option>
-                <option value="NM">NM (edit distance of the aligned read to the reference)</option>
-                <option value="MD">MD (string for mismatching positions)</option>
+                <expand macro="common_SAM_attributes"/>
                 <option value="MC">MC (CIGAR string for mate/next segment)</option>
-                <option value="jM">jM (intron motifs for all junctions)</option>
-                <option value="jI">jI (1-based start and end of introns for all junctions)</option>
+                <option value="XS">XS (strand flag, see parameter help below) </option>
                 <option value="ch" selected="true">ch (used to indicate chimeric alignments)</option>
             </param>
             <param argument="--outSAMattrIHstart" name="HI_offset" type="select" display="radio"
@@ -469,7 +464,7 @@ used: >=5 mappings => MAPQ=0; 3-4 mappings => MAPQ=1; 2 mappings => MAPQ=3. This
                     </section>
 
                     <section name="align" title="Alignment parameters" expanded="false">
-                        <param argument="--alignIntronMin" name="alignIntronMin" type="integer" min="0" value="21" label="Minimum intron size"/>
+                        <param argument="--alignIntronMin" type="integer" min="0" value="21" label="Minimum intron size"/>
                         <param argument="--alignIntronMax" type="integer" min="0" value="0" label="Maximum intron size"/>
                         <param argument="--alignMatesGapMax" type="integer" min="0" value="0" label="Maximum gap between two mates"/>
                         <param argument="--alignSJoverhangMin" type="integer" min="1" value="5" label="Minimum overhang for spliced alignments"/>
@@ -518,12 +513,8 @@ used: >=5 mappings => MAPQ=0; 3-4 mappings => MAPQ=1; 2 mappings => MAPQ=3. This
                         <param argument="--chimMultimapScoreRange" type="integer" min="0" value="1"
                         label="Score range for multi-mapping chimeras"
                         help="The threshold below the best chimeric score that a multimapping chimera must have to be output. This is ignored unless --chimMultimapNmax is above 1" />
                     </section>
-                    <section name="limits" title="Limits" expanded="false">
-                        <param argument="--limitOutSJoneRead" type="integer" min="1" value="1000" label="Maximum number of junctions for one read (including all multimappers)" />
-                        <param argument="--limitOutSJcollapsed" type="integer" min="1" value="1000000" label="Maximum number of collapsed junctions" />
-                        <param argument="--limitSjdbInsertNsj" type="integer" min="0" value="1000000" label="Maximum number of inserts to be inserted into the genome on the fly." />
-                    </section>
+                    <expand macro="limits" />
                 </when>
             </conditional>
         </section>
@@ -570,7 +560,7 @@ used: >=5 mappings => MAPQ=0; 3-4 mappings => MAPQ=1; 2 mappings => MAPQ=3. This
             </conditional>
             <conditional name="refGenomeSource">
                 <param name="geneSource" value="history" />
-                <param name="genomeFastaFiles" value="tophat_test.fa" />
+                <param name="genomeFastaFiles" value="tophat_test.fa.gz" />
                 <param name="genomeSAindexNbases" value="5" />
             </conditional>
             <section name="oformat">
@@ -1024,7 +1014,7 @@ generated. Hence, be sure to select either:
 In addition, the following parameters_ related to chimeric alignment are recommended for improved sensitivity
 
 - under *Output filter criteria*,
-  **Would you like to set additional output filters?**: select `Yes' to set 
+  **Would you like to set additional output filters?**: select `Yes` to set 
   **Maximum number of alignments to output a read's alignment results, plus 1** to 50 
 
 - under *Algorithmic settings*, **Configure seed, alignment and limits options**: