annotate aws_sra.xml @ 28:8e6c35583761 draft

planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 133ce5adcf21338376fb8a1fa0003d97ffc8cbbb
author galaxytrakr
date Tue, 24 Mar 2026 01:35:38 +0000
parents 4f6a7017cbbb
children 569a598c7e68
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
28
8e6c35583761 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 133ce5adcf21338376fb8a1fa0003d97ffc8cbbb
galaxytrakr
parents: 27
diff changeset
1 <tool id="aws_sra" name="NCBI SRA AWS Fetch" version="0.4.0+gt_0.7" profile="23.0">
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
2 <description>Fetches one or more SRA runs from AWS S3 and converts them to FASTQ</description>
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
3
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
4 <requirements>
2
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
5 <requirement type="package" version="2.34.8">awscli</requirement>
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
6 <requirement type="package" version="3.2.1">sra-tools</requirement>
83c923bd9da6 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit a95de952e58b29875b31e55f0ef06a83a18618fc
galaxytrakr
parents: 1
diff changeset
7 <requirement type="package" version="2.8">pigz</requirement>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
8 </requirements>
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
9
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
10 <version_command>fasterq-dump --version</version_command>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
11
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
12 <command detect_errors="aggressive"><![CDATA[
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
13 ## Build accessions.txt with one accession per line; commas and runs of spaces in the user input act as separators, empty lines are dropped
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
14 echo '$accession' | sed 's/,/\n/g; s/ \+/\n/g' | grep . > accessions.txt &&
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
15
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
16 ## Loop over each clean accession; every shell dollar sign is backslash-escaped so the template engine passes it through to bash untouched
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
17 for acc in \$(cat accessions.txt);
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
18 do
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
19 echo "Processing accession: \$acc" &&
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
20
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
21 ## 1. Create per-accession scratch directories so runs in the same job do not collide
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
22 mkdir -p "sra_cache_\${acc}" "fastq_out_\${acc}" &&
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
24 ## 2. Download the run object from the public bucket (unsigned request, no credentials needed)
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
25 aws s3 cp --no-sign-request "s3://sra-pub-run-odp/sra/\${acc}/\${acc}" "./sra_cache_\${acc}/" &&
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
26
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
27 ## 3. Convert the downloaded run to FASTQ with fasterq-dump
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
28 fasterq-dump --outdir "./fastq_out_\${acc}" --temp . --threads \${GALAXY_SLOTS:-4} --split-files "./sra_cache_\${acc}/\${acc}" &&
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
29
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
30 ## 4. Compress every FASTQ in place with pigz (the glob stays outside the quotes so it still expands)
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
31 pigz -p \${GALAXY_SLOTS:-4} "./fastq_out_\${acc}"/*.fastq &&
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
32
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
33 ## 5. Move outputs for collection discovery; the template-filled directory is single-quoted and the shell-expanded file name double-quoted. NOTE(review): confirm discovery actually scans files_path, since discover_datasets sets no directory
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
34 #if str($layout) == 'paired'
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
35 mv "./fastq_out_\${acc}/\${acc}_1.fastq.gz" '$output_r1.files_path'/"\${acc}_1.fastq.gz" &&
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
36 mv "./fastq_out_\${acc}/\${acc}_2.fastq.gz" '$output_r2.files_path'/"\${acc}_2.fastq.gz" &&
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
37 #else
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
38 mv "./fastq_out_\${acc}/\${acc}.fastq.gz" '$output_r1.files_path'/"\${acc}.fastq.gz" &&
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
39 #end if
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
40
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
41 ## 6. Clean up; abort the job if any step for this accession failed, and end the loop body with a semicolon so "done" still parses once the lines are joined
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
42 rm -rf "sra_cache_\${acc}" "fastq_out_\${acc}" || exit 1;
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
43 done
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
44 ]]></command>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
45
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
46 <inputs>
28
8e6c35583761 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 133ce5adcf21338376fb8a1fa0003d97ffc8cbbb
galaxytrakr
parents: 27
diff changeset
47 <param name="accession" type="text" label="SRA Accession(s)" value="" optional="false" help="Provide one or more accession numbers (separated by commas, spaces, or newlines)."/>
8e6c35583761 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 133ce5adcf21338376fb8a1fa0003d97ffc8cbbb
galaxytrakr
parents: 27
diff changeset
48 <param name="layout" type="select" label="Read layout" optional="false" help="This setting is applied to all accessions.">
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
49 <option value="paired" selected="true">Paired-end (R1 + R2)</option>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
50 <option value="single">Single-end</option>
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
51 </param>
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
52 </inputs>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
53
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
54 <outputs>
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
55 <collection name="output_r1" type="list" label="FASTQ Reads (R1) for ${accession}">
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
56 <discover_datasets pattern="(?P&lt;designation&gt;.+)_1\.fastq\.gz" format="fastqsanger.gz" />
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
57 </collection>
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
58 <collection name="output_r2" type="list" label="FASTQ Reads (R2) for ${accession}">
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
59 <discover_datasets pattern="(?P&lt;designation&gt;.+)_2\.fastq\.gz" format="fastqsanger.gz" />
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
60 <filter>layout == 'paired'</filter>
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
61 </collection>
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
62 </outputs>
17
9fb80e0392ce planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 9707fa5e3ca6db5b58f271d133484d078cf65390
galaxytrakr
parents: 16
diff changeset
63
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
64 <tests>
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
65 <test expect_num_outputs="2"> <!-- paired layout: one R1 and one R2 list, each holding the single requested run -->
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
66 <param name="accession" value="SRR13333333"/>
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
67 <param name="layout" value="paired"/>
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
68 <output_collection name="output_r1" type="list" count="1">
24
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
69 <element name="SRR13333333" ftype="fastqsanger.gz" decompress="true"> <!-- identifier is the regex designation: the file name without _1.fastq.gz; decompress so has_text sees plain FASTQ -->
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
70 <assert_contents>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
71 <has_text text="@SRR13333333"/>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
72 </assert_contents>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
73 </element>
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
74 </output_collection>
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
75 <output_collection name="output_r2" type="list" count="1">
24
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
76 <element name="SRR13333333" ftype="fastqsanger.gz" decompress="true"> <!-- identifier is the regex designation: the file name without _2.fastq.gz; decompress so has_text sees plain FASTQ -->
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
77 <assert_contents>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
78 <has_text text="@SRR13333333"/>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
79 </assert_contents>
7dbb60c48056 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 29ed254c4aaab320b5482db410bd236d00f1b70e
galaxytrakr
parents: 23
diff changeset
80 </element>
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
81 </output_collection>
21
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
82 </test>
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
83 </tests>
02f45c03c306 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit f72940592c22c9ba88f1dcb23ef8bb5199ce434e
galaxytrakr
parents: 20
diff changeset
84
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
85 <help><![CDATA[
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
86 **NCBI SRA AWS Fetch**
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
87
23
d7f68b3cde39 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit e9adf514c1b6b341c9e5bf8cc5a41c79b738d48e
galaxytrakr
parents: 22
diff changeset
88 Fetches one or more SRA runs from the public `sra-pub-run-odp` S3 bucket and converts them to gzip-compressed FASTQ using `fasterq-dump`. This tool uses `aws s3 cp` for direct downloads within the AWS environment.
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
89 ]]></help>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
90
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
91 <citations>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
92 <citation type="bibtex">
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
93 @misc{ncbi_sra_aws,
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
94 title = {{NCBI} {SRA} on {AWS} Open Data},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
95 author = {{National Center for Biotechnology Information}},
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
96 howpublished = {\url{https://registry.opendata.aws/ncbi-sra/}},
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
97 note = {Accessed via AWS S3 without credentials}
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
98 }
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
99 </citation>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
100 <citation type="bibtex">
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
101 @article{sra_toolkit,
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
102 title = {The {NCBI} {SRA} and portable data in biology},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
103 author = {Leinonen, Rasko and Sugawara, Hideaki and Shumway, Martin and
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
104 {International Nucleotide Sequence Database Collaboration}},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
105 journal = {Nucleic Acids Research},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
106 volume = {39},
13
2897d365dd62 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit 619ebd7e6a24be0ec6c2728511290f43b0bad89f
galaxytrakr
parents: 12
diff changeset
107 number = {suppl\_1},
0
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
108 pages = {D19--D21},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
109 year = {2011},
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
110 doi = {10.1093/nar/gkq1019}
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
111 }
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
112 </citation>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
113 </citations>
a4afe551dfc9 planemo upload for repository https://github.com/CFSAN-Biostatistics/galaxytrakr-tools commit c55c06b92c0ee0429047bcff1992bf2ec293284a
galaxytrakr
parents:
diff changeset
114 </tool>