-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathget_promoters.sh
More file actions
45 lines (26 loc) · 857 Bytes
/
get_promoters.sh
File metadata and controls
45 lines (26 loc) · 857 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
#!/usr/bin/env bash
# get_promoters.sh - extract upstream (promoter) sequences for a list of genes.
#
# Interactively prompts for:
#   1. promoter length in bp (passed to `bedtools flank -l`)
#   2. genome FASTA file name
#   3. GFF annotation file name
#   4. gene list file name (one pattern per line, consumed by `grep -f`)
# All file names are resolved relative to the current working directory.
#
# Files written to the working directory:
#   upstream.fa  - FASTA sequences of the selected upstream regions
#   chrom.sizes  - first two columns of the FASTA index
#   <fasta>.fai  - FASTA index produced by `samtools faidx`
# Side effect: the gene list file is rewritten in sorted order.
#
# Requires bash (uses `$(<file)`), samtools, bedtools and gff2bed on PATH.

# Abort on the first failing command or unset variable so later steps never
# run on empty or stale intermediate files.
set -eu

# Print an error message to stderr and exit with a non-zero status.
die() {
  printf 'get_promoters: %s\n' "$*" >&2
  exit 1
}

# Remove the intermediate files created by this script.
cleanup() {
  rm -f -- temp.search temp.bed tempUp.bed selected.bed sorted.bed
}

echo Enter required length for promoter region
# `|| true`: at EOF `read` fails but still sets the variable (to empty);
# the validation below reports the problem with a clear message.
read -r len || true
echo Enter fasta file name located in working directory
echo For example: Aedes.fa
read -r fasta || true
echo Enter gff file name located in working directory
echo For example: Aedes.gff
read -r gff || true
echo Enter gene list file name located in working directory
echo For example: search.txt
read -r search || true

# Validate everything up front, before any file is created or overwritten.
[[ "$len" =~ ^[0-9]+$ ]] \
  || die "promoter length must be a non-negative integer, got '$len'"
for input in "$fasta" "$gff" "$search"; do
  [[ -f "$input" && -r "$input" ]] || die "cannot read input file '$input'"
done
for tool in samtools bedtools gff2bed; do
  command -v "$tool" > /dev/null || die "required tool '$tool' not found on PATH"
done

# From here on intermediates exist; make sure they are removed on any exit.
trap cleanup EXIT

# Sort the gene list, write the sorted version back over the user's file,
# and echo it so the user can see which patterns will be searched.
sort -k1 -- "$search" > temp.search
cp -f -- temp.search "$search"
printf '%s\n' "$(<"$search")"

# Index the genome and derive the genome file that `bedtools flank -g` needs.
samtools faidx "$fasta"
cut -f 1,2 -- "$fasta.fai" > chrom.sizes

# Convert the annotation to BED and compute, for every feature, the $len bp
# flanking region on its left; `-s` makes "left" strand-aware.
gff2bed < "$gff" > temp.bed
bedtools flank -i temp.bed -g chrom.sizes -l "$len" -r 0 -s > tempUp.bed

# Keep flanks whose line matches any gene-list pattern and mentions
# protein_coding_gene, reduced to columns 1, 2, 3 and 10.
# NOTE(review): patterns are treated as regular expressions and match anywhere
# in the line; an empty line in the gene list matches every feature.
grep -f temp.search tempUp.bed | grep protein_coding_gene | cut -f 1,2,3,10 > selected.bed
sort -k4 selected.bed > sorted.bed
printf '%s\n' "$(<sorted.bed)"

# Extract sequences from the FASTA the user supplied (this was previously
# hard-coded to Aedes.fa, ignoring the file name entered at the prompt).
# NOTE(review): getfasta is run without -s, so regions are reported as they
# appear on the forward strand - confirm this is what downstream steps expect.
bedtools getfasta -fi "$fasta" -bed sorted.bed > upstream.fa