-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathinput_parameters.py
More file actions
41 lines (33 loc) · 1.32 KB
/
input_parameters.py
File metadata and controls
41 lines (33 loc) · 1.32 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Do NOT change these parameters (lines 2-7).
DATA_FOLDER = "/data"
MULTIFASTA_FOLDER = "Multifasta/"
IN_PROCESS_FOLDER = "in_process"
TEMP_FOLDER = "Temp/"
OUTPUT_FOLDER = "Output/"
OUTPUT_PARSNP_FOLDER = "Output_parsnp/"
# Ingroup and Outgroup folders WITHOUT path
INGROUP_FOLDER = "Ingroup_Demo"
OUTGROUP_FOLDER = "Outgroup_Demo"
# Leave None to use all genomes in the ingroup folder or specify the number of genomes to use
INGROUP_SIZE = None
# Leave None to use all genomes in the outgroup folder or specify the number of genomes to use
OUTGROUP_SIZE = None
# Filtering parameters for the parsnp alignment
MINIMUM_ALIGNMENT_LENGTH = 300 # Minimum sequence length in an alignment
# Minimum percentage of genomes that there should be an alignment values from [0,100]
MINIMUM_ALIGNMENT_COVERAGE = 99
MINIMUM_ALIGNMENT_PERCENTAGE_IDENTITY = 99
# Add the location of the parsnp file to avoid re-run parsnp
PARSNP_XMFA_FILE_LOCATION = ""
FILTERED_XMFA_FILE_LOCATION = ""
# Maximum sequence length for a sequence alignment to be blast
SEQUENCE_LENGTH = 300
SHIFT = 250
E_CUTOFF_OUTGROUP = 1
PERC_IDENTITY_OUTGROUP = 60
# Format of the input files
FORMAT = "fasta"
# Removing older output files
CLEANUP_DAYS = 60
# Maximum percentage of matches (0-100) 0 = There should be zero hits, and 100 we allow all the hits
OUTGROUP_FILTER_PERCENTAGE = 50