-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathconfig_1502.py
51 lines (42 loc) · 1.94 KB
/
config_1502.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
project_id = '150.2'
dry_run = False
compulsory = ['.delta', '.delta.coords']
"""
compulsory extension of files
"""
forbidden = ['.invertions.delta.q.delta', '.invertions.delta.q.delta.coords', '.fasta.delta', '.fasta.delta.coords']
#forbidden = ['.invertions.delta.q.delta', '.invertions.delta.q.delta.coords', '.fasta.delta.coords']
"""
forbidden extension of files
"""
def retAll(l):
return 'all scaffolds'
labelFields = {
'refName' : [r'(\S+?)_SL2.40ch\d+' , os.path.basename, None ],
'refChrom': [r'SL2.40ch(\d+)' , None , None ],
'tgtName' : [r'_\._(\S+)_scaffold_final\.assembly\.fasta', None , None ],
'tgtChrom': [r'(.)' , None , retAll ],
'status' : [r'\.fasta(\S+)' , None , None ]
}
"""
Regular expression to extract information from filenames
"""
titleFmt = '%(refName)s vs %(tgtChrom)s - Chromosome %(refChrom)s - %(status)s'
xlabelFmt = '%(refName)s Chromosome %(refChrom)s'
ylabelFmt = '%(tgtName)s'
"""
output format for title, xlabel and ylabel using the information extracted from file name
"""
statusMatch = {
'.delta' : 'Raw Dot Plot',
'.delta.coords' : 'Raw Dot Plot',
'.delta.q.delta' : 'Clean Dot Plot',
'.delta.q.delta.coords' : 'Clean Dot Plot',
'.delta.q.delta.filter' : 'Clean & Filtered Dot Plot',
'.delta.q.delta.filter.coords' : 'Clean & Filtered Dot Plot',
'.delta.q.delta.filter.invertions.delta' : 'Clean & Filtered Dot Plot. Only Inversions',
'.delta.q.delta.filter.invertions.delta.coords': 'Clean & Filtered Dot Plot. Only Inversions',
}
"""
mapping from extension to stage of processing of file
"""