-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathprocessFinderResults.sh
81 lines (55 loc) · 2.02 KB
/
processFinderResults.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
#!/bin/bash
if [ $# -ne 1 ]
then
echo "usage $0 <chrom>"
exit 1
fi
CHR=$1
# find total num vus in a clean file
cat $CHR-out.json | python -m json.tool > $CHR-pretty.json
grep '(' $CHR-pretty.json > ${CHR}.txt
sed -i 's/\ \ \ \ \ \ \ \ \"//' ${CHR}.txt
sed -i 's/\".*//' ${CHR}.txt
cat ${CHR}.txt | sort | uniq > $CHR-uniq.txt
numVUS=$(wc -l $CHR-uniq.txt|awk '{print $1}')
# find total num cooc vus
sed -n '/cooccurring vus/,/homozygous vus/p' $CHR-pretty.json > $CHR-coocs.json
grep '(' $CHR-coocs.json > $CHR-coocs.txt
sed -i 's/\ \ \ \ \ \ \ \ \"//' $CHR-coocs.txt
sed -i 's/\".*//' $CHR-coocs.txt
cat $CHR-coocs.txt | sort > $CHR-coocs-sorted.txt
numCoocs=$(wc -l $CHR-coocs-sorted.txt|awk '{print $1}')
# find total num homo vus
sed -n '/homozygous vus/,$ p' $CHR-pretty.json > $CHR-homo.json
grep '(' $CHR-homo.json > $CHR-homo.txt
sed -i 's/\ \ \ \ \ \ \ \ \"//' $CHR-homo.txt
sed -i 's/\".*//' $CHR-homo.txt
cat $CHR-homo.txt | sort > $CHR-homo-sorted.txt
numHomo=$(wc -l $CHR-homo-sorted.txt|awk '{print $1}')
# find unique and intersecting counts
# comm -123 (1 = suppress unique to f1, 2 => suppress unique to f2, 3=>suppress in both)
comm -23 $CHR-coocs-sorted.txt $CHR-homo-sorted.txt > $CHR-only-coocs.txt
numOnlyCooc=$(wc -l $CHR-only-coocs.txt | awk '{print $1}')
comm -13 $CHR-coocs-sorted.txt $CHR-homo-sorted.txt > $CHR-only-homo.txt
numOnlyHomo=$(wc -l $CHR-only-homo.txt | awk '{print $1}')
comm -12 $CHR-homo-sorted.txt $CHR-coocs-sorted.txt > $CHR-both.txt
numIntersection=$(wc -l $CHR-both.txt | awk '{print $1}')
echo "new int = $numIntersection"
((numIntersection=$numVUS - $numOnlyCooc - $numOnlyHomo))
echo "total VUS = $numVUS"
echo "num only cooccuring = $numOnlyCooc"
echo "num only homozygous = $numOnlyHomo"
echo "num of intersection = $numIntersection"
# cleanup files
rm $CHR-coocs-sorted.txt
rm $CHR-homo-sorted.txt
rm $CHR-homo.txt
rm $CHR-coocs.txt
rm $CHR-homo.json
rm $CHR-coocs.json
rm $CHR-pretty.json
rm $CHR-uniq.txt
rm ${CHR}.txt
#rm $CHR-only-coocs.txt
#rm $CHR-only-homo.txt
#rm $CHR-both.txt