-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathMakeBulkRnaSeqNextflowConfig.pm
More file actions
107 lines (87 loc) · 3.86 KB
/
MakeBulkRnaSeqNextflowConfig.pm
File metadata and controls
107 lines (87 loc) · 3.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
package ApiCommonWorkflow::Main::WorkflowSteps::MakeBulkRnaSeqNextflowConfig;
@ISA = (ApiCommonWorkflow::Main::WorkflowSteps::WorkflowStep);
use warnings;
use strict;
use ApiCommonWorkflow::Main::WorkflowSteps::WorkflowStep;
sub run {
my ($self, $test, $undo) = @_;
#NOTE: the subset size here would run "X" number of genomic sequences at a time on the cluster (chromosomes or contigs)
my $fastaSubsetSize = 5;
my $resultsDirectory = $self->getParamValue("resultsDirectory");
my $sampleSheet = $self->getParamValue("sampleSheetFile");
my $gtfFile = $self->getParamValue("gtfFile");
my $genomeFile = $self->getParamValue("genomeFile");
my $nextflowConfigFile = $self->getParamValue("nextflowConfigFile");
my $isStranded = $self->getBooleanParamValue("isStranded") ? "true" : "false";
my $intronLength = $self->getParamValue("maxIntronLength");
my $cdsOrExon = $self->getParamValue("cdsOrExon");
my $organismAbbrev = $self->getParamValue("organismAbbrev");
my $workflowDataDir = $self->getWorkflowDataDir();
my $workingDirRelativePath = $self->getParamValue("workingDirRelativePath");
my $digestedSampleSheetPath = $self->relativePathToNextflowClusterPath($workingDirRelativePath, $sampleSheet);
my $digestedGtfFilePath = $self->relativePathToNextflowClusterPath($workingDirRelativePath, $gtfFile);
my $digestedGenomeFilePath = $self->relativePathToNextflowClusterPath($workingDirRelativePath, $genomeFile);
my $digestedOutputDir = $self->relativePathToNextflowClusterPath($workingDirRelativePath, $resultsDirectory);
my $clusterServer = $self->getSharedConfig('clusterServer');
my $clusterWorkflowDataDir = $self->getClusterWorkflowDataDir();
my $executor = $self->getClusterExecutor();
my $lsfEnv = $self->getNextflowLsfScratchEnvBlock();
my $clusterConfigFile = "\$baseDir/conf/${executor}.config";
if ($undo) {
$self->runCmd(0, "rm $workflowDataDir/$nextflowConfigFile");
} else {
my $nextflowConfig = "$workflowDataDir/$nextflowConfigFile";
open(F, ">$nextflowConfig") || die "Can't open task prop file '$nextflowConfig' for writing";
my $configString = <<NEXTFLOW;
params {
fasta = "$digestedGenomeFilePath"
gtf = "$digestedGtfFilePath"
input = "$digestedSampleSheetPath"
outdir = "$digestedOutputDir"
isStranded = $isStranded
intronLength = $intronLength
cdsOrExon = "$cdsOrExon"
useExistingIndex = false
genome = "$organismAbbrev"
}
includeConfig "\$baseDir/conf/nfcore_boilerplate.config"
includeConfig "$clusterConfigFile"
process {
maxForks = 10
}
def check_max(obj, type) {
if (type == 'memory') {
try {
if (obj.compareTo(params.max_memory as nextflow.util.MemoryUnit) == 1)
return params.max_memory as nextflow.util.MemoryUnit
else
return obj
} catch (all) {
println " ### ERROR ### Max memory '\${params.max_memory}' is not valid! Using default value: \$obj"
return obj
}
} else if (type == 'time') {
try {
if (obj.compareTo(params.max_time as nextflow.util.Duration) == 1)
return params.max_time as nextflow.util.Duration
else
return obj
} catch (all) {
println " ### ERROR ### Max time '\${params.max_time}' is not valid! Using default value: \$obj"
return obj
}
} else if (type == 'cpus') {
try {
return Math.min( obj, params.max_cpus as int )
} catch (all) {
println " ### ERROR ### Max cpus '\${params.max_cpus}' is not valid! Using default value: \$obj"
return obj
}
}
}
NEXTFLOW
print F $configString . $lsfEnv;
close(F);
}
}
1;