-
Notifications
You must be signed in to change notification settings - Fork 1
/
Mapping_to_orangutan_Y_transcripts.sh
28 lines (22 loc) · 1.47 KB
/
Mapping_to_orangutan_Y_transcripts.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
#Mapping merged shared transcripts per sample per gene family to publicly available orangutan Y chromosome transcripts
#!/bin/bash
#SBATCH --job-name=marta
#SBATCH --output=marta-%j.out
#SBATCH --error=marta-%j.err
#SBATCH -C new
#SBATCH --nodes=1
#SBATCH --ntasks=20
#SBATCH --mem=500G
makeblastdb -in Y_orangutan_transcripts.fa -title Y_orangutan_transcripts -dbtype nucl -out Y_orangutan_transcripts -parse_seqids
SAMPLE_path=/nfs/brubeck.bx.psu.edu/scratch6/marta/Capture_great_apes/All_samples/overhang/new_barcodes/IsoCon_15/annotate_clusters
output_path=/nfs/brubeck.bx.psu.edu/scratch6/marta/Capture_great_apes/All_samples/overhang/new_barcodes/IsoCon_15/annotate_clusters/blastn_query_orang_Y_transcripts
db_path=/nfs/brubeck.bx.psu.edu/scratch6/marta/Capture_great_apes/All_samples/overhang/new_barcodes/IsoCon_15/annotate_clusters/db_orang_transcripts
mkdir -p $output_path
for SAMPLE in 1 2 3 4 5 6 7 8
do
for GENE in BPY2 CDY DAZ HSFY PRY RBMY TSPY VCY_chimp_bonobo VCY_human XKRY
do
blastn -query $db_path/Y_orangutan_transcripts.fa -db $SAMPLE_path/$SAMPLE/$GENE/shared_transcripts -out $output_path/$SAMPLE\_$GENE\_reverse_results_blastn.txt -evalue 1e-30 -outfmt 11
blast_formatter -archive $output_path/$SAMPLE\_$GENE\_reverse_results_blastn.txt -outfmt "6 qseqid sseqid qcovs length pident evalue bitscore mismatch gaps qstart qend sstart send qseq sseq" -out $output_path/$SAMPLE\_$GENE\_results_blastn_query_orang_Y_transcripts_tabular.txt
done
done