-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathprojectvars_template.sh
123 lines (85 loc) · 3.24 KB
/
projectvars_template.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
##
########## RUN INFORMATION ##########
# Run identifier:
export RUNID="RUN_00";
# Samples suffix:
export R1="_R1_001"
export R2="_R2_001"
########## OPTIONS AND VARIABLES ##########
# Computation:
export NCPUS=32
# Assembly:
export minconlen=100; #Minimum contigs length
#blast
export DBsize=5000000000;
########## PROJECT PATHS AND FILESYSTEM ##########
# Base "root" dir
export RDIR="dir/to/MYPROJECT";
# directory where to find nextflow scripts and config files.
export NXFDIR="${RDIR}/CAPTVRED";
# Directory with the data: samples_definition.tbl, rawseqs_fastq dir, ...
export BDIR="${RDIR}/${RUNID}"; #NEXTFLOW MUST BE RUN FROM THIS DIRECTORY
#samples_definition.tbl must be placed in this folder.
#projectvars.sh must be placed in this folder
#Reference sequences and databases:
export REFSQSD="${RDIR}/REFSEQS"
## Viral candidates
export AMPSQD="${REFSQSD}/ampliconseqs"; #directory that contains the fasta file of refseqs.
export AMPSQFA="Viral_candidates_zoonosis.fa.gz"; #Name of the compressed fasta file that contians the sequences of all amplicons used to design the probes.
export AMPSQINFO="Viral_candidates_zoonosis_full_info.tsv";
export AMPGFFD=""; #directory that contains the gff file of refseqs.
## Blast databases
export BL_DB_D="${REFSQSD}/rvdb_nt" #Blast ref database directory
export BL_DB_NM="C-RVDBvCurrent.fasta.gz"
export BL_DB_IF="C-RVDB_allentries_info.txt"
#Kaiju databases
export KAI_DB_D="${REFSQSD}/kaijudb"; #Directory where the kaiju databases are installed
export KAI_DB_NM="nr_euk";
export KAI_DB_NMraw="rvdb";
#BBduk resources
export BBDUK_RES="${REFSQSD}/bbmap/resources" # resources required for bbduk.sh to work
# Handle potential contamination:
contamin_ids=""; #NCBI identifiers of the refseqs of the potential contaminant sequence.
contamin_faa=""; #Protein fasta file of the potentially contaminant sequence.
# PATH (directories where used programes are installed):
#export BBDUK_PATH="/usr/local/install/bbmap";
# Filesystem required by workflow:
#Do not modify!!
#scripts directory:
export BIND="$NXFDIR/bin"
export TMPD="$BDIR/tmp"
mkdir -vp $TMPD
export RAWFQ="$BDIR/rawseqs_fastq"
mkdir -vp $RAWFQ
#fastq data mult be placed here before running nextflow.
export CLNDIR="$BDIR/cleanseqs"
mkdir -vp $CLNDIR
export AMPALD="$BDIR/amplicons_alignment"; #amplicons alignment directory
mkdir -vp $AMPALD
export ASSBLD="$BDIR/assembly"; #assembly directory
mkdir -vp $ASSBLD/megahit
mkdir -vp $ASSBLD/trinity
export CBLASTD="$BDIR/contigs_blast";
mkdir -vp $CBLASTD/blastn
mkdir -vp $CBLASTD/tblastx
export TAXDIR="$BDIR/taxonomy";
mkdir -vp $TAXDIR/reads_taxon
mkdir -vp $TAXDIR/contigs_taxon/blastn
mkdir -vp $TAXDIR/contigs_taxon/tblastx
mkdir -vp $TAXDIR/contigs_taxon/kaiju
mkdir -vp $TAXDIR/taxon_viral_candidates
export RPTD="$BDIR/reports";
mkdir -vp $RPTD;
mkdir -vp $RPTD/coverage_figures
export LOGD="$BDIR/logs";
mkdir -vp $LOGD
#Do not modify!!
##
## NextFlow
# directory where working files are stored
export NXF_HOME="$BDIR/.nextflow";
export NXF_WORK="$BDIR/work";
export NXF_HTML="$RPTD/$RUNID.html";
export NXF_TIMELINE="$RPTD/${RUNID}_timeline.html";
export NXF_DAG="$RPTD/${RUNID}_dag.dot";
# mkdir -vp $NXF_HOME $NXF_WORK; # those folders are created automatically by NextFlow