annotate aws_sra.xml @ 16:58cc45662c63 draft

planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
author galaxytrakr
date Mon, 23 Mar 2026 20:23:58 +0000
parents 25cf81d65cb8
children 9fb80e0392ce
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
16
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
1 <tool id="aws_sra" name="NCBI SRA AWS Fetch" version="0.3.0+gt_0.16" profile="23.0">
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
2 <description>Fetches SRA runs from AWS and converts them to FASTQ</description>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
3
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
4 <requirements>
2
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
5 <requirement type="package" version="2.34.8">awscli</requirement>
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
6 <requirement type="package" version="3.2.1">sra-tools</requirement>
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
7 <requirement type="package" version="2.8">pigz</requirement>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
8 </requirements>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
9
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
10 <version_command>fasterq-dump --version</version_command>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
11
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
12 <command detect_errors="aggressive"><![CDATA[
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
13 ## This loop handles both 'single' and 'batch' modes.
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
14 #for $acc_line in $run_type.mode == 'single' and str($run_type.accession).split() or $run_type.accession_list.lines:
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
15 #set $acc = $acc_line.strip()
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
16 #if $acc:
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
17
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
18 echo "Processing accession: $acc" &&
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
19
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
20 ## 1. Create unique directories for this accession
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
21 mkdir -p sra_cache_${acc} fastq_out_${acc} &&
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
22
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
23 ## 2. Download the file from S3 using the discovered path format
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
24 aws s3 cp --no-sign-request 's3://sra-pub-run-odp/sra/${acc}/${acc}' ./sra_cache_${acc}/ &&
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
25
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
26 ## 3. Convert with fasterq-dump, using the correct argument order
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
27 fasterq-dump --outdir ./fastq_out_${acc} --temp . --threads \${GALAXY_SLOTS:-4} --split-files ./sra_cache_${acc}/${acc} &&
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
28
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
29 ## 4. Compress with pigz
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
30 pigz -p \${GALAXY_SLOTS:-4} ./fastq_out_${acc}/*.fastq &&
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
31
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
32 ## 5. Move outputs to special directories Galaxy can discover
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
33 #if $layout == 'paired'
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
34 mv ./fastq_out_${acc}/${acc}_1.fastq.gz '$output_r1.files_path/${acc}_1.fastq.gz' &&
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
35 mv ./fastq_out_${acc}/${acc}_2.fastq.gz '$output_r2.files_path/${acc}_2.fastq.gz'
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
36 #else
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
37 mv ./fastq_out_${acc}/*.fastq.gz '$output_r1.files_path/${acc}.fastq.gz'
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
38 #end if &&
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
39
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
40 ## 6. Clean up temporary files
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
41 rm -rf sra_cache_${acc} fastq_out_${acc}
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
42
6
8c60cd4c0ca7 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 69bae7a0b8011217f6c61fbc62344bcd6a445160
galaxytrakr
parents: 5
diff changeset
43 #end if
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
44 #end for
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
45 ]]></command>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
46
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
47 <inputs>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
48 <!-- This conditional allows the user to choose a single run or a list of runs -->
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
49 <conditional name="run_type">
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
50 <param name="mode" type="select" label="Execution Mode" help="Run on a single accession or a list of accessions from a file.">
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
51 <option value="single" selected="true">Single Accession</option>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
52 <option value="batch">Batch of Accessions</option>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
53 </param>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
54 <when value="single">
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
55 <param name="accession" type="text" label="SRA Accession" help="e.g., SRR13333333"/>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
56 </when>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
57 <when value="batch">
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
58 <param name="accession_list" type="data" format="txt" label="List of SRA Accessions" help="A plain text file with one SRA accession per line."/>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
59 </when>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
60 </conditional>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
61
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
62 <!-- This layout parameter is always required -->
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
63 <param name="layout" type="select" label="Read layout" help="Check the SRA record to confirm layout before running.">
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
64 <option value="paired" selected="true">Paired-end (R1 + R2)</option>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
65 <option value="single">Single-end</option>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
66 </param>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
67 </inputs>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
68
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
69 <outputs>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
70 <!-- These collections will gather all the files produced by the loop -->
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
71 <collection name="output_r1" type="list" label="${run_type.accession or 'FASTQ Reads (R1)'}">
15
25cf81d65cb8 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit fd740a9434d21f68658fe261b1b043033e491b05
galaxytrakr
parents: 14
diff changeset
72 <discover_datasets pattern="(?P&lt;designation&gt;.+)_1\.fastq\.gz" format="fastqsanger.gz" />
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
73 </collection>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
74 <collection name="output_r2" type="list" label="${run_type.accession or 'FASTQ Reads (R2)'}">
15
25cf81d65cb8 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit fd740a9434d21f68658fe261b1b043033e491b05
galaxytrakr
parents: 14
diff changeset
75 <discover_datasets pattern="(?P&lt;designation&gt;.+)_2\.fastq\.gz" format="fastqsanger.gz" />
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
76 <filter>layout == 'paired'</filter>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
77 </collection>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
78 </outputs>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
79
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
80 <tests>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
81 <test expect_num_outputs="2">
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
82 <param name="mode" value="single"/>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
83 <param name="accession" value="SRR13333333"/>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
84 <param name="layout" value="paired"/>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
85 <output_collection name="output_r1" type="list" count="1">
16
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
86 <element name="SRR13333333_1" ftype="fastqsanger.gz">
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
87 <assert_contents>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
88 <has_text text="@SRR13333333"/>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
89 </assert_contents>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
90 </element>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
91 </output_collection>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
92 <output_collection name="output_r2" type="list" count="1">
16
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
93 <element name="SRR13333333_2" ftype="fastqsanger.gz">
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
94 <assert_contents>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
95 <has_text text="@SRR13333333"/>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
96 </assert_contents>
58cc45662c63 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 98b1c300d492ffb675d64e6c64484c681b277369
galaxytrakr
parents: 15
diff changeset
97 </element>
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
98 </output_collection>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
99 </test>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
100 </tests>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
101
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
102 <help><![CDATA[
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
103 **NCBI SRA AWS Fetch**
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
104
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
105 Fetches SRA runs from the public `sra-pub-run-odp` bucket on Amazon S3 and converts them to gzip-compressed FASTQ using `fasterq-dump`.
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
106
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
107 This tool can be run on a single SRA accession or a list of accessions provided as a text file (one per line).
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
108
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
109 Outputs are automatically organized into collections suitable for downstream analysis.
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
110 ]]></help>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
111
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
112 <citations>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
113 <citation type="bibtex">
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
114 @misc{ncbi_sra_aws,
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
115 title = {{NCBI} {SRA} on {AWS} Open Data},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
116 author = {{National Center for Biotechnology Information}},
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
117 howpublished = {\\url{https://registry.opendata.aws/ncbi-sra/}},
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
118 note = {Accessed via AWS S3 without credentials}
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
119 }
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
120 </citation>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
121 <citation type="bibtex">
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
122 @article{sra_toolkit,
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
123 title = {The {NCBI} {SRA} and portable data in biology},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
124 author = {Leinonen, Rasko and Sugawara, Hideaki and Shumway, Martin and
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
125 {International Nucleotide Sequence Database Collaboration}},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
126 journal = {Nucleic Acids Research},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
127 volume = {39},
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
128 number = {suppl\\\_1},
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
129 pages = {D19--D21},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
130 year = {2011},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
131 doi = {10.1093/nar/gkq1019}
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
132 }
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
133 </citation>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
134 </citations>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
135 </tool>