-
Notifications
You must be signed in to change notification settings - Fork 0
/
cellranger-arc-mkref.cwl
171 lines (139 loc) · 4.35 KB
/
cellranger-arc-mkref.cwl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
cwlVersion: v1.0
class: CommandLineTool
requirements:
- class: InlineJavascriptRequirement
expressionLib:
- var get_output_folder_name = function() {
if (inputs.output_folder_name == ""){
var root = inputs.genome_fasta_file.basename.split('.').slice(0,-1).join('.');
return (root == "")?inputs.genome_fasta_file.basename:root;
} else {
return inputs.output_folder_name;
}
};
- class: InitialWorkDirRequirement
listing: |
${
var exclude_chr = "[]";
if (inputs.exclude_chr && inputs.exclude_chr.length > 0){
exclude_chr = '["' + inputs.exclude_chr.join('", "') + '"]'
}
var entry = `
{
genome: ["${get_output_folder_name()}"]
input_fasta: ["${inputs.genome_fasta_file.path}"]
input_gtf: ["${inputs.annotation_gtf_file.path}"]
non_nuclear_contigs: ${exclude_chr}
}`
return [{
"entry": entry,
"entryname": "config.txt"
}];
}
hints:
- class: DockerRequirement
dockerPull: cumulusprod/cellranger-arc:2.0.0
inputs:
genome_fasta_file:
type: File
doc: |
Genome FASTA file
annotation_gtf_file:
type: File
doc: |
GTF annotation file.
exclude_chr:
type:
- "null"
- string[]
doc: |
Contigs that do not have any chromatin structure, for example,
mitochondria or plastids. These contigs are excluded from peak
calling since the entire contig will be "open" due to a lack of
chromatin structure
output_folder_name:
type: string?
default: ""
doc: |
Unique genome name, used to name output folder
threads:
type: int?
inputBinding:
position: 5
prefix: "--nthreads"
doc: |
Number of threads used during STAR genome indexing
Default: 1
memory_limit:
type: int?
inputBinding:
position: 6
prefix: "--memgb"
doc: |
Maximum memory (GB) used when aligning reads with STAR
Defaults: 16
outputs:
indices_folder:
type: Directory
outputBinding:
glob: $(get_output_folder_name())
doc: |
Compatible with Cell Ranger ARC reference folder that includes
STAR and BWA indices
stdout_log:
type: stdout
stderr_log:
type: stderr
baseCommand: ["cellranger-arc", "mkref", "--config", "config.txt"]
stdout: cellranger_arc_mkref_stdout.log
stderr: cellranger_arc_mkref_stderr.log
$namespaces:
s: http://schema.org/
$schemas:
- https://github.com/schemaorg/schemaorg/raw/main/data/releases/11.01/schemaorg-current-http.rdf
label: "Cell Ranger ARC Build Reference Indices"
s:name: "Cell Ranger ARC Build Reference Indices"
s:alternateName: |
Builds Cell Ranger ARC compatible reference folder from the
custom genome FASTA and gene GTF annotation files
s:downloadUrl: https://raw.githubusercontent.com/Barski-lab/sc-seq-analysis/main/tools/cellranger-arc-mkref.cwl
s:codeRepository: https://github.com/Barski-lab/sc-seq-analysis
s:license: http://www.apache.org/licenses/LICENSE-2.0
s:isPartOf:
class: s:CreativeWork
s:name: Common Workflow Language
s:url: http://commonwl.org/
s:creator:
- class: s:Organization
s:legalName: "Cincinnati Children's Hospital Medical Center"
s:location:
- class: s:PostalAddress
s:addressCountry: "USA"
s:addressLocality: "Cincinnati"
s:addressRegion: "OH"
s:postalCode: "45229"
s:streetAddress: "3333 Burnet Ave"
s:telephone: "+1(513)636-4200"
s:logo: "https://www.cincinnatichildrens.org/-/media/cincinnati%20childrens/global%20shared/childrens-logo-new.png"
s:department:
- class: s:Organization
s:legalName: "Allergy and Immunology"
s:department:
- class: s:Organization
s:legalName: "Barski Research Lab"
s:member:
- class: s:Person
s:name: Michael Kotliar
s:email: mailto:[email protected]
s:sameAs:
- id: http://orcid.org/0000-0002-6486-3898
doc: |
Cell Ranger ARC Build Reference Indices
Builds Cell Ranger ARC compatible reference folder from the custom
genome FASTA and gene GTF annotation files.
Notes:
- `input_motifs` parameter in the `config.txt` file is not
implemented.
- if GTF file provided in `annotation_gtf_file` has records with
duplicate gene_id, they should be grouped together. Applicable to
USCS RefGene annotations.