-
Notifications
You must be signed in to change notification settings - Fork 0
/
run_SweepFinder.py
62 lines (47 loc) · 1.79 KB
/
run_SweepFinder.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
# -*- coding: utf-8 -*-
"""
Created on Wed Aug 26 14:07:56 2015
@author: RJovelin
"""
from accessories import *
from sites_with_coverage import *
import os
# get the allele counts for all sites with coverage, exclude sites with sample size < 10
# [chromo: {site : [ref_allele, alt_allele, count_ref, count alt]}]
chromo_sites = get_non_coding_snps('../SNP_files/', 10)
print('got allele counts in genome')
# make a list of positions for scaffold_144
positions = [i for i in chromo_sites['scaffold_144']]
# sort list
positions.sort()
# make input file
newfile = open('testfileSweepFinder.txt', 'w')
# write header
newfile.write('position' + '\t' + 'x' + '\t' + 'n' + '\t' + 'folded' + '\n')
for i in positions:
ref_count = chromo_sites['scaffold_144'][i][2]
alt_count = chromo_sites['scaffold_144'][i][3]
if ref_count != 0 and alt_count != 0:
# site is polymorphic
# find minor allele
ref = chromo_sites['scaffold_144'][i][0]
alt = chromo_sites['scaffold_144'][i][1]
if alt_count + ref_count >= 45:
if alt_count <= ref_count:
# alt is minor
x = alt_count
elif ref_count < alt_count:
# ref is minor
x = ref_count
n = ref_count + alt_count
newfile.write('\t'.join([str(i+1), str(x), str(n), '1']) + '\n')
newfile.close()
# get the gridsize paramater
genome = convert_fasta('../CREM_CLA_protein_divergence/noamb_356_v1_4.txt')
GRIDSIZE = int(len(genome['scaffold_144']) / 26)
print(GRIDSIZE)
#os.system('cp testfileSweepFinder.txt ~/SF')
#os.chdir('../../SF')
# run SweepFinder
os.system('SweepFinder2 -sg 1000 testfileSweepFinder.txt testfileSFoupoutscaffold144.txt')
#os.system('cp testfileSFoupoutscaffold144.txt ../CREM_POP_GENOMICS/Sweep_Finder_remanei/')