-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathtest_MLclassifier.py
59 lines (42 loc) · 2.1 KB
/
test_MLclassifier.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
import os
import pytest
from VCF.VCFfilter.MLclassifier import MLclassifier
def test_train_snps(datadir):
"""
Train the model for SNPs
"""
ML_obj = MLclassifier()
outfile = ML_obj.train(outprefix="{0}/outdir/fitted_logreg_snps".format(datadir),
tp_annotations="{0}/TP_annotations_snps.chr20.tsv".format(datadir),
fp_annotations="{0}/FP_annotations_snps.chr20.tsv".format(datadir))
assert os.path.isfile(outfile) is True
def test_train_snps_gz(datadir):
"""
Train the model for SNPs using 2 gzipped annotation files
"""
ML_obj = MLclassifier()
outfile = ML_obj.train(outprefix="{0}/outdir/fitted_logreg_snps".format(datadir),
tp_annotations="{0}/TP_annotations_snps.chr20.tsv.gz".format(datadir),
fp_annotations="{0}/FP_annotations_snps.chr20.tsv.gz".format(datadir))
def test_train_indels(datadir):
"""
Train the model for INDELs
"""
ML_obj = MLclassifier()
outfile = ML_obj.train(outprefix="{0}/outdir/fitted_logreg_indels".format(datadir),
tp_annotations="{0}/TP_annotations_indels.chr20.tsv".format(datadir),
fp_annotations="{0}/TP_annotations_indels.chr20.tsv".format(datadir))
assert os.path.isfile(outfile) is True
def test_apply_model(clean_tmp, datadir):
ML_obj = MLclassifier(fitted_model="{0}/outdir/fitted_logreg_snps.sav".format(datadir))
outfile = ML_obj.predict(outprefix="{0}/outdir/predictions".format(datadir),
annotation_f="{0}/TP_annotations_snps.chr20.tsv".format(datadir),
cutoff=0.95)
assert os.path.isfile(outfile) is True
def test_rfe(datadir, clean_tmp):
ML_obj = MLclassifier()
select_feats_report = ML_obj.rfe(tp_annotations="{0}/TP_annotations_indels.chr20.tsv".format(datadir),
fp_annotations="{0}/TP_annotations_indels.chr20.tsv".format(datadir),
n_features=5,
outreport="{0}/outdir/out_rfe.txt".format(datadir))
assert os.path.isfile(select_feats_report) is True