-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathscore_validate.sh
More file actions
executable file
·19 lines (14 loc) · 953 Bytes
/
score_validate.sh
File metadata and controls
executable file
·19 lines (14 loc) · 953 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
#!/bin/bash
# score_validate.sh - pair each score with the 0.01-wide bin of its
# companion value.
#
# Usage: score_validate.sh [INPUT [OUTPUT]]
#   INPUT   tab-separated table to read   (default: scores_dbNSFP_narrow)
#   OUTPUT  file to write the pairs into  (default: scores_PROVEAN)
#
# Exit status: 0 on success, 1 when INPUT cannot be read (OUTPUT is then
# left untouched instead of being truncated to an empty file).
#
# Classes construction - 84th 1000Gp1; 100th - ExAC
# NOTE(review): the numbers above look like column indices in the full
# dbNSFP table, and column 3 of the narrow table is presumably the PROVEAN
# score - confirm against the step that builds scores_dbNSFP_narrow.
#
# pipefail is deliberately not enabled: grep -v exits 1 when it filters out
# every line, which is not an error for this script.

#######################################
# Reduce a tab-separated table on stdin to "<score> <bin>" pairs.
# Keeps columns 3 and 4, drops every line containing '1000G_AF'
# (presumably the header row - verify), drops rows where either value is
# the "." placeholder, and prints column 3 followed by the index of the
# 0.01-wide bin that column 4 falls into.
# Arguments: none
# Outputs:   one "<col3> <bin>" line per retained row on stdout
#######################################
bin_scores() {
  cut -f 3,4 \
    | grep -v '1000G_AF' \
    | awk '
        $1 != "." && $2 != "." {
          # Binary floating point makes e.g. 0.29/0.01 evaluate to
          # 28.999999999999996, which int() alone would truncate to 28.
          # The tiny offset puts exact non-negative multiples of 0.01
          # back into their own bin without moving any other value.
          print $1, int($2 / 0.01 + 1e-9)
        }'
}

#######################################
# Run the binning step from an input file into an output file.
# Arguments: $1 - input table  (optional, default scores_dbNSFP_narrow)
#            $2 - output file  (optional, default scores_PROVEAN)
# Outputs:   writes the pairs to the output file; errors go to stderr
# Returns:   1 if the input is unreadable, else the pipeline status
#######################################
main() {
  local input=${1:-scores_dbNSFP_narrow}
  local output=${2:-scores_PROVEAN}

  # Check before opening the output so a missing input cannot clobber a
  # previously generated result.
  if [[ ! -r "$input" ]]; then
    printf '%s: cannot read input file: %s\n' "${0##*/}" "$input" >&2
    return 1
  fi

  bin_scores < "$input" > "$output"
}

main "$@"
# grep -v '1000Gp1' SIFT | grep -P '^T.*\d.*' > false_class
# grep -v '1000Gp1' SIFT | grep -P '^D.*\d.*' > true_class
# Binning
# awk '{ print $2, int($2/0.01) }' false_class | sort -n | uniq -c > FC_binned
# Cleanup and formatting
# perl -pe 's|^ +||' TC_binned | awk -F ' ' '{ print $2, $1 }' | sed 's/ /\t/' | head -n 51 > TC.cleaned
# perl -pe 's|^ +||' FC_binned | awk -F ' ' '{ print $2, $1 }' | sed 's/ /\t/' | head -n 51 > FC.cleaned
# Making final table
# cut -f 2 FC.cleaned | paste TC.cleaned - > cc.SIFT.classified.cleaned
# RMA stuff - 8th 1000G, 9th ExAC
# cut -d ',' -f 8 ../final_file/predictedRMA | awk '{ print int($1/0.01) }' | sort -n | uniq -c | perl -pe 's|^ +||' | awk -F ' ' '{ print $2, $1 }' | sed 's/ /\t/' > RMA.cleaned