-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathfavites_lite.py
executable file
·139 lines (129 loc) · 6.36 KB
/
favites_lite.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
#! /usr/bin/env python3
'''
FAVITES-Lite
Niema Moshiri 2022
'''
# useful constants
RNG_SEED_MIN = 0
RNG_SEED_MAX = 2147483647
# general imports and load global.json
from os import makedirs, remove
from os.path import abspath, expanduser, isdir, isfile, realpath
from shutil import rmtree
from sys import argv, stderr
from time import time
import json
import random
# global.json is expected to sit in the same directory as this script
GLOBAL_JSON_PATH = "%s/global.json" % '/'.join(abspath(realpath(expanduser(__file__))).split('/')[:-1])
# read the settings inside a `with` block so the file handle is always closed
with open(GLOBAL_JSON_PATH) as _global_json_file:
    GLOBAL = json.load(_global_json_file)
# external imports
try:
    import numpy
except ImportError:
    # error() comes from plugins.common, which is imported further down and is
    # not available yet at this point, so report the problem directly on stderr
    print("Unable to import numpy. Install with: pip install numpy", file=stderr)
    raise SystemExit(1)
# FAVITES-Lite-specific imports
from plugins import PLUGIN_FUNCTIONS
from plugins.common import *
# parse user args
def parse_args(argv=None):
    '''
    Parse the FAVITES-Lite command-line arguments.

    Args:
        argv: Optional list of argument strings (without the program name).
            When None (the default), argparse reads them from sys.argv, which
            is the behavior of calling parse_args() with no arguments.

    Returns:
        An argparse.Namespace with the attributes config, output, overwrite,
        rng_seed, quiet, and version.
    '''
    import argparse
    parser = argparse.ArgumentParser(description=__doc__, formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument('-c', '--config', required=True, type=str, help="FAVITES-Lite Config File")
    parser.add_argument('-o', '--output', required=True, type=str, help="Output Directory")
    parser.add_argument('--overwrite', action="store_true", help="Overwrite output directory if it exists")
    parser.add_argument('--rng_seed', required=False, type=int, default=None, help="Random Number Generator Seed")
    parser.add_argument('--quiet', action="store_true", help="Suppress Log Messages")
    parser.add_argument('--version', action="store_true", help="Show FAVITES-Lite version")
    return parser.parse_args(argv)
# validate user args
def validate_args(args, verbose=True):
    '''
    Check the parsed command-line arguments and prepare the run.

    Picks a random RNG seed when none was given (storing it back on args),
    records the seed in GLOBAL['RNG_SEED'], and seeds both `random` and
    `numpy.random` with it. Then checks that the config file exists and, if
    the output path already exists, removes it after confirmation (either the
    --overwrite flag or an interactive Y/N prompt).

    Args:
        args: Namespace returned by parse_args(); rng_seed may be updated.
        verbose: When True, progress messages are emitted through print_log.
    '''
    # --- RNG seed ---
    seed = args.rng_seed
    if seed is None:
        seed = random.randint(RNG_SEED_MIN, RNG_SEED_MAX)
        args.rng_seed = seed
    elif not (RNG_SEED_MIN <= seed <= RNG_SEED_MAX):
        error("Invalid RNG seed (%s). Must be in the range [%d, %d]" % (seed, RNG_SEED_MIN, RNG_SEED_MAX))
    GLOBAL['RNG_SEED'] = seed
    random.seed(seed)
    numpy.random.seed(seed)
    if verbose:
        print_log("RNG Seed: %d" % seed)

    # --- config file ---
    config_path = args.config
    if not isfile(config_path):
        error("Config file not found: %s" % config_path)
    if verbose:
        print_log("Config File: %s" % config_path)

    # --- output directory ---
    out_path = args.output
    already_exists = isdir(out_path) or isfile(out_path)
    if not already_exists:
        if verbose:
            print_log("Output Directory: %s" % out_path)
        return
    # the prompt is only shown when --overwrite was not given
    confirmed = args.overwrite or input('Output directory exists: "%s". Overwrite? (Y/N) ' % out_path).upper().startswith('Y')
    if not confirmed:
        error("Didn't overwrite output directory: %s" % out_path)
        return
    if verbose:
        print_log("Overwriting output directory: %s" % out_path)
    # the existing path may be a directory tree or a plain file
    if isdir(out_path):
        rmtree(out_path)
    else:
        remove(out_path)
# validate FAVITES-Lite config
def validate_config(config):
    '''
    Check a loaded FAVITES-Lite config against the model definitions in GLOBAL.

    For every step listed in GLOBAL['CONFIG_KEYS'] this verifies that:
      * the step is present and names a model,
      * the model is one of those defined in GLOBAL['MODELS'][step],
      * any models the chosen model requires in other steps ('REQS') are the
        ones selected there,
      * the step's 'param' section exists and holds exactly the parameters
        listed in the model's 'PARAM' entry.

    Every problem is reported through error().
    NOTE(review): this assumes error() terminates the program; confirm against
    plugins.common.

    Args:
        config: The config as loaded from the user's JSON file.
    '''
    for step in GLOBAL['CONFIG_KEYS']:
        if step not in config:
            error("Invalid config file: Missing step: %s" % step)
        step_config = config[step]
        if 'model' not in step_config:
            error("Invalid config file: Missing model in step: %s" % step)
        model = step_config['model']
        # report an unknown model as a config error instead of a raw KeyError
        if model not in GLOBAL['MODELS'][step]:
            error('Invalid config file: Unknown model for step "%s": %s' % (step, model))
        model_spec = GLOBAL['MODELS'][step][model]

        # models this one requires in other steps
        for req_step, req_model in model_spec.get('REQS', {}).items():
            # the required step may come later in CONFIG_KEYS and not have been checked yet
            if req_step not in config or 'model' not in config[req_step]:
                error('Invalid config file: Step "%s" model "%s" requires step "%s" model "%s", but that step has no model' % (step, model, req_step, req_model))
            selected = config[req_step]['model']
            if selected != req_model:
                error('Invalid config file: Step "%s" model "%s" requires step "%s" model "%s", but you selected: %s' % (step, model, req_step, req_model, selected))

        # parameters: all expected ones present, and nothing extra
        if 'param' not in step_config:
            error('Invalid config file: Missing "param" in step: %s' % step)
        given_params = step_config['param']
        expected_params = model_spec['PARAM']
        for p in expected_params:
            if p not in given_params:
                error('Invalid config file: Missing parameter for step "%s" model "%s": %s' % (step, model, p))
        # every expected parameter is present, so a size mismatch means extras
        if len(given_params) != len(expected_params):
            error('Invalid config file: Too many parameters for step "%s" model "%s"' % (step, model))
# run FAVITES-Lite
if __name__ == "__main__":
    # "version", "-version" and "--version" are handled before argparse runs,
    # because the parser would otherwise insist on --config and --output
    if len(argv) > 1 and argv[1].lower().lstrip('-') == 'version':
        print("FAVITES-Lite v%s" % GLOBAL['VERSION']); exit()
    start_time = time()
    args = parse_args()
    verbose = not args.quiet
    if verbose:
        print_log("=== FAVITES-Lite v%s ===" % GLOBAL['VERSION'])
        print_log("Command: %s" % ' '.join(argv))
    validate_args(args, verbose=verbose)

    # load and validate the user's config; `with` closes the file handle
    with open(args.config) as config_file:
        config = json.load(config_file)
    validate_config(config)

    # create the output directory and keep a copy of the config with the results
    makedirs(args.output)
    with open("%s/config.json" % args.output, 'w') as config_copy:
        json.dump(config, config_copy)

    # output paths handed to every plugin
    out_fn = {
        'intermediate': "%s/intermediate_files" % args.output,
        'contact_network': "%s/contact_network.tsv" % args.output,
        'transmission_network': "%s/transmission_network.tsv" % args.output,
        'all_state_transitions': "%s/all_state_transitions.tsv" % args.output,
        'sample_times': "%s/sample_times.tsv" % args.output,
        'viral_phylogeny_all_chains_time': "%s/intermediate_files/viral_phylogeny_all_chains_time.nwk" % args.output,
        'viral_phylogeny_seed_time': "%s/intermediate_files/viral_phylogeny_seed_time.nwk" % args.output,
        'viral_phylogeny_time': "%s/phylogeny.time.nwk" % args.output,
        'viral_phylogeny_mut': "%s/phylogeny.mutations.nwk" % args.output,
        'ancestral_seq': "%s/ancestral_sequence.fas" % args.output,
        'sequences': "%s/sequences.fas" % args.output,
    }
    makedirs(out_fn['intermediate'])
    if verbose:
        print_log("Intermediate Files: %s" % out_fn['intermediate'])

    # run each step, in the order given by GLOBAL['CONFIG_KEYS'], with its selected model
    for step in GLOBAL['CONFIG_KEYS']:
        if verbose:
            print_log(); print_log("=== %s ===" % step)
        model = config[step]['model'].strip()
        if verbose:
            print_log("Model: %s" % model)
        params = config[step]['param']
        if verbose:
            for p in GLOBAL['MODELS'][step][model]['PARAM']:
                print_log("Parameter: %s: %s" % (p, params[p]))
        if step not in PLUGIN_FUNCTIONS:
            error("Step not implemented yet: %s" % step)
        if model not in PLUGIN_FUNCTIONS[step]:
            error("%s model not implemented yet: %s" % (step, model))
        PLUGIN_FUNCTIONS[step][model](params, out_fn, config, GLOBAL, verbose=verbose)

    end_time = time()
    if verbose:
        print_log(); print_log("=== Completion ===")
        print_log("Total runtime: %s seconds" % (end_time-start_time))