-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSnakefile4
46 lines (34 loc) · 1.6 KB
/
Snakefile4
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
import os
import pandas as pd
from pprint import pprint
# Recipient address used by the onsuccess/onerror handlers when mailing the log.
EMAIL = "alexanderytong@gmail.com"
# CSV read by get_files/get_score_files; they use its `path` column.
FILE = 'runs/vacs_runs.csv'
def get_files(wildcards):
    """Return every entry of the ``path`` column of the runs CSV as a list.

    ``wildcards`` is accepted but never read; the result depends only on
    the CSV named by ``FILE``, which is re-read on every call.
    """
    run_table = pd.read_csv(FILE)
    return [entry for entry in run_table.path]
def get_score_files(wildcards):
    """Return one ``scores.npy`` path per row of the runs CSV.

    For each entry of the ``path`` column, the last path component is
    dropped and ``scores.npy`` is joined onto the remaining directory.
    ``wildcards`` is accepted but never read.
    """
    run_table = pd.read_csv(FILE)
    score_paths = []
    for run_path in run_table.path:
        # os.path.split yields (head, tail); only the head is kept.
        parent_dir, _ = os.path.split(run_path)
        score_paths.append(os.path.join(parent_dir, 'scores.npy'))
    return score_paths
# Anonymous rule listed before all other rules: it has no output and only
# requests every scores.npy path returned by get_score_files.
rule:
    input:
        get_score_files
# Produces model.json for one run directory by calling train_all3.py with the
# path wildcards, followed by the fixed arguments 256 and 20000
# (their meaning is defined by train_all3.py, not visible here).
rule train:
    output:
        "{prefix}/{dataset}2/{model}/{class}/{seed}/{frac_corrupt}/model.json"
    shell:
        "python train_all3.py {wildcards.prefix} {wildcards.dataset}2 {wildcards.model} {wildcards.class} {wildcards.seed} {wildcards.frac_corrupt} 256 20000"
# Produces scores.npy next to the model.json emitted by the train rule.
# score_all3.py is run with CUDA_VISIBLE_DEVICES set to the empty string.
rule predict_models:
    input:
        rules.train.output
    output:
        "{prefix}/{dataset}2/{model}/{class}/{seed}/{frac_corrupt}/scores.npy"
    shell:
        "CUDA_VISIBLE_DEVICES='' python score_all3.py {wildcards.prefix} {wildcards.dataset}2 {wildcards.model} {wildcards.class} {wildcards.seed} {wildcards.frac_corrupt}"
# Produces scores.npy for directories whose model component starts with
# "shallow_". The prefix is part of the output pattern only, so the
# {model} value passed to train_baseline3.py does not include it.
# This rule has no input.
rule predict_baseline:
    output:
        "{prefix}/{dataset}2/shallow_{model}/{class}/{seed}/{frac_corrupt}/scores.npy"
    shell:
        "python train_baseline3.py {wildcards.prefix} {wildcards.dataset}2 {wildcards.model} {wildcards.class} {wildcards.seed} {wildcards.frac_corrupt}"
# A ".../shallow_<x>/.../scores.npy" target matches the output patterns of both
# rules; prefer predict_baseline over predict_models when that happens.
ruleorder: predict_baseline > predict_models
# Runs accumulate_scores.py over every scores.npy path returned by
# get_score_files and writes the result to all_scores.pkl. The script is
# listed as an input and is passed the score paths followed by the output path.
rule accumulate_scores:
    input:
        scores=get_score_files,
        program='accumulate_scores.py'
    output:
        "{prefix}/{dataset}/all_scores.pkl"
    shell:
        "python {input.program} {input.scores} {output}"
# Success handler: mails the log to EMAIL.
onsuccess:
    # EMAIL is substituted here with %; {log} is left for shell() to fill in.
    success_mail_cmd = "mail -s 'Snakemake Completed!' %s < {log}" % EMAIL
    shell(success_mail_cmd)
# Error handler: mails the log to EMAIL.
onerror:
    # EMAIL is substituted here with %; {log} is left for shell() to fill in.
    error_mail_cmd = "mail -s 'Snakemake Error' %s < {log}" % EMAIL
    shell(error_mail_cmd)