-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathMapping_to_gorilla_Y_transcripts.sh
26 lines (21 loc) · 1.35 KB
/
Mapping_to_gorilla_Y_transcripts.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/bin/bash
# Slurm batch script: runs blastn with the gorilla Y transcripts FASTA as the
# query against a "shared_transcripts" BLAST database for each sample/gene
# pair, then converts every BLAST archive result into a tabular report.
#
# The #SBATCH lines below are scheduler directives; they must stay ahead of
# the first executable command to be honoured by sbatch.
#
# Job name shown in the queue.
#SBATCH --job-name=marta
# Standard output and standard error go to separate files; %j is the job ID.
#SBATCH --output=marta-%j.out
#SBATCH --error=marta-%j.err
# Node feature constraint. NOTE(review): "new" is presumably a site-defined
# feature tag on this cluster — confirm it still exists.
#SBATCH -C new
# One node, 20 tasks, 500G of memory.
# NOTE(review): blastn is invoked further down without -num_threads, so the
# searches presumably run single-threaded — confirm 20 tasks are really needed.
#SBATCH --nodes=1
#SBATCH --ntasks=20
#SBATCH --mem=500G
# Build a nucleotide BLAST database from Y_gorilla_transcripts.fa in the
# current working directory (the directory the job was started from).
# NOTE(review): the searches below use the per-sample/per-gene
# shared_transcripts databases, not this one, so a failure here is reported
# but does not stop the run — confirm whether this step is still required.
if ! makeblastdb -in Y_gorilla_transcripts.fa -title Y_gorilla_transcripts -dbtype nucl -out Y_gorilla_transcripts -parse_seqids; then
  printf 'warning: makeblastdb failed for Y_gorilla_transcripts.fa\n' >&2
fi

# Root directory holding one sub-directory per sample, each with one
# sub-directory per gene.
SAMPLE_path=/nfs/brubeck.bx.psu.edu/scratch6/marta/Capture_great_apes/All_samples/overhang/new_barcodes/IsoCon_15/annotate_clusters
# Where the BLAST archives and tabular reports are written.
output_path="$SAMPLE_path/blastn_query_gorilla_Y_transcripts"
# Directory containing the query FASTA (Y_gorilla_transcripts.fa).
db_path="$SAMPLE_path/db_gorilla_transcripts"

# Without the output directory every search would fail, so stop right away.
if ! mkdir -p -- "$output_path"; then
  printf 'error: cannot create output directory %s\n' "$output_path" >&2
  exit 1
fi

# Number of sample/gene pairs for which a BLAST step failed.
failures=0

for SAMPLE in 1 2 3 4 5 6 7 8; do
  for GENE in BPY2 CDY DAZ HSFY PRY RBMY TSPY VCY_chimp_bonobo VCY_human XKRY; do
    # ${VAR}_ keeps the underscore out of the variable name; the old \_ trick
    # only works while the word is left unquoted.
    archive="$output_path/${SAMPLE}_${GENE}_reverse_results_blastn.txt"
    tabular="$output_path/${SAMPLE}_${GENE}_results_blastn_query_gorilla_Y_transcripts_tabular.txt"

    # Search the gorilla Y transcripts (query) against this sample/gene
    # database and store the result as a BLAST archive (-outfmt 11), which
    # blast_formatter can convert afterwards.
    if ! blastn -query "$db_path/Y_gorilla_transcripts.fa" \
      -db "$SAMPLE_path/$SAMPLE/$GENE/shared_transcripts" \
      -out "$archive" -evalue 1e-30 -outfmt 11; then
      printf 'error: blastn failed for sample %s, gene %s\n' "$SAMPLE" "$GENE" >&2
      failures=$((failures + 1))
      # Do not format a missing or stale archive; move on to the next pair.
      continue
    fi

    # Convert the archive into a tab-separated report with the listed columns.
    if ! blast_formatter -archive "$archive" \
      -outfmt "6 qseqid sseqid qcovs length pident evalue bitscore mismatch gaps qstart qend sstart send qseq sseq" \
      -out "$tabular"; then
      printf 'error: blast_formatter failed for sample %s, gene %s\n' "$SAMPLE" "$GENE" >&2
      failures=$((failures + 1))
    fi
  done
done

# Surface partial failures through the job's exit status instead of letting
# the last command's status hide them.
if [ "$failures" -gt 0 ]; then
  printf 'error: %s sample/gene pair(s) failed\n' "$failures" >&2
  exit 1
fi