forked from VUmcCGP/sanefalcon
-
Notifications
You must be signed in to change notification settings - Fork 0
/
predict.py
38 lines (31 loc) · 1.45 KB
/
predict.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# Copyright (C) 2016 VU University Medical Center Amsterdam
# Author: Roy Straver ([email protected])
#
# This file is part of SANEFALCON
# SANEFALCON is distributed under the following license:
# Attribution-NonCommercial-ShareAlike, CC BY-NC-SA (https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode)
# This license is governed by Dutch law and this license is subject to the exclusive jurisdiction of the courts of the Netherlands.
import sys
nuclData=dict()
with open(sys.argv[1],'r') as referenceFile:
correlations = [float(x) for x in referenceFile.readline().split(" ")]
scalars = [float(x) for x in referenceFile.readline().split(" ")]
#print len(correlations),scalars
with open(sys.argv[2],'r') as profileFile:
# In these readlines -1 to drop the 'end of line' comma from a previous awk
profile = [float(x) for x in profileFile.readline().split(",")[:-1]]
profile.reverse()
#profile2=([float(x) for x in profileFile.readline().split(",")[1:-1]])
profile.extend([float(x) for x in profileFile.readline().split(",")[1:-1]])
#print len(profile)
totalReads=sum(profile)
normProfile=[x/totalReads for x in profile]
summed=0
for i,val in enumerate(normProfile):
summed+=val*correlations[i]
fetalFraction = scalars[0]*summed+scalars[1]
if len(correlations) == len(normProfile):
print "Fetal Fraction:\t",fetalFraction
else:
print "ERROR: correlation and sample profiles are not aligned"
print "Nucleosome Profile:","\t".join([str(x) for x in normProfile])