-
Notifications
You must be signed in to change notification settings - Fork 1
/
protein_evidence_mapping.cwl
99 lines (95 loc) · 2.39 KB
/
protein_evidence_mapping.cwl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
#!/usr/bin/env cwl-runner
# Common Workflow Language document, written against CWL v1.0.
# `class: Workflow` means this file wires together other tools/workflows
# (see `steps`) rather than describing a single command line.
cwlVersion: v1.0
class: Workflow
# Workflow inputs. Each parameter's label/type/format must be nested under
# the parameter name; at a single indentation level they collide as
# duplicate keys.
inputs:
  # Genomic contigs; consumed by the `metaeuk` and `samtools_index_contigs`
  # steps.
  contigs_fasta:
    label: "Genomic contigs (FASTA)"
    type: File
    format: edam:format_1929
  # Protein sequences; consumed by the `metaeuk` (as query) and
  # `samtools_index_protein` steps.
  proteins_fasta:
    label: "Proteins (FASTA)"
    type: File
    format: edam:format_1929
  # Optional (`string?`); forwarded unchanged to the `species` input of the
  # `spaln` step.
  species_table:
    label: "Spaln species table to use (optional)"
    type: string?
# Workflow outputs.
outputs:
  # Single File taken from the `combined_spaln_output` output of the final
  # `process_spaln_output` step.
  spaln_out:
    type: File
    outputSource: process_spaln_output/combined_spaln_output
# Workflow-level requirements (map form, keyed by requirement class).
requirements:
  # Minimum resources requested from the runner. Per the CWL spec ramMin is
  # expressed in mebibytes; coresMin is a CPU core count.
  ResourceRequirement:
    ramMin: 4096
    coresMin: 1
# Workflow steps. Data flow, as wired by the `in` sources below:
#   metaeuk -> extract_region_specs -> extract_region_pairs -> spaln
#     -> process_spaln_output
# The two samtools_index_* steps feed extract_region_pairs directly.
steps:
  # Runs the MetaEuk tool wrapper with the contigs and the proteins as query.
  metaeuk:
    run: tools/metaeuk_easy_predict.cwl
    in:
      contigs: contigs_fasta
      query: proteins_fasta
    out:
      - output_fasta

  # Passes the contigs FASTA through the bio-cwl-tools samtools faidx
  # wrapper; the result is exposed as `sequences_with_index`.
  samtools_index_contigs:
    run: bio-cwl-tools:samtools/samtools_faidx.cwl
    in:
      sequences: contigs_fasta
    out:
      - sequences_with_index

  # Same as above, for the proteins FASTA.
  samtools_index_protein:
    run: bio-cwl-tools:samtools/samtools_faidx.cwl
    in:
      sequences: proteins_fasta
    out:
      - sequences_with_index

  # Turns the MetaEuk FASTA output into contig region files and protein
  # lists. Both outputs are scattered over downstream, so they are
  # presumably arrays of equal length -- confirm in
  # tools/metaeuk_to_regions.cwl.
  extract_region_specs:
    run: tools/metaeuk_to_regions.cwl
    in:
      metaeuk_fasta: metaeuk/output_fasta
    out:
      - contig_regions_files
      - proteins_lists

  # Scattered sub-workflow: one job per (contig_region, protein) pair.
  # `dotproduct` pairs the i-th element of each scattered input, so both
  # arrays must have the same length. The two `all_*_fasta` inputs are not
  # scattered; every job receives the same indexed file.
  extract_region_pairs:
    requirements:
      - class: ScatterFeatureRequirement
      - class: SubworkflowFeatureRequirement
    scatter:
      - contig_region
      - protein
    scatterMethod: dotproduct
    run: make_search_pair_workflow.cwl
    in:
      all_contig_fasta: samtools_index_contigs/sequences_with_index
      all_protein_fasta: samtools_index_protein/sequences_with_index
      contig_region: extract_region_specs/contig_regions_files
      protein: extract_region_specs/proteins_lists
    out:
      - contig_fasta
      - protein_fasta

  # Scattered Spaln run: the i-th contig FASTA is paired with the i-th
  # protein FASTA produced by extract_region_pairs (dotproduct again).
  spaln:
    requirements:
      - class: ScatterFeatureRequirement
    scatter:
      - genome_fasta
      - query_fasta
    scatterMethod: dotproduct
    run: tools/spaln.cwl
    in:
      genome_fasta: extract_region_pairs/contig_fasta
      query_fasta: extract_region_pairs/protein_fasta
      # Optional workflow input; null when the caller does not supply it.
      species: species_table
      # No source is connected, so the default is always used. The meaning
      # of 0 is defined by tools/spaln.cwl.
      output_format:
        default: 0
    out:
      - spaln_out

  # Gathers the per-pair Spaln outputs into the single file that the
  # workflow exposes as `spaln_out`.
  process_spaln_output:
    run: tools/process_spaln_output.cwl
    in:
      spaln_outputs: spaln/spaln_out
    out:
      - combined_spaln_output
# Prefix -> base IRI map. `edam:` is used by the `format` fields of the
# inputs; `bio-cwl-tools:` is used by the `run` fields of the samtools
# steps. The prefixes must be nested under `$namespaces` to be recognised.
$namespaces:
  edam: http://edamontology.org/
  bio-cwl-tools: https://raw.githubusercontent.com/common-workflow-library/bio-cwl-tools/release/
# Schema/ontology documents to load alongside this file (here: one EDAM
# release).
$schemas:
  - http://edamontology.org/EDAM_1.18.owl