forked from Armxyz1/Genomics
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.py
More file actions
56 lines (39 loc) · 1.74 KB
/
main.py
File metadata and controls
56 lines (39 loc) · 1.74 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
import argparse
from preprocess.process_data import get_data
from align.align_reads import align_reads
from analytics.clean_data import cleanup
from analytics.graphs import *
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='Read Matching')
parser.add_argument('--bwt', type=str, help='BWT file path', default='gene_data/chrX_last_col.txt')
parser.add_argument('--map', type=str, help='Character Map file path', default='gene_data/chrX_map.txt')
parser.add_argument('--ref', type=str, help='Reference Sequence file path', default='gene_data/chrX.fa')
parser.add_argument('--reads', type=str, help='Reads file path', default='gene_data/reads')
parser.add_argument('--err_thresh', type=int, help='Error Threshold', default=2)
parser.add_argument('--save_path', type=str, help='Save Path', default='results')
args = parser.parse_args()
bwt_path = args.bwt
map_path = args.map
fa_path = args.ref
reads_path = args.reads
err_thresh = args.err_thresh
save_path = args.save_path
print("Reading Data...")
bwt, len_n, idx, reference, reads = get_data(bwt_path, map_path, fa_path, reads_path)
print("Data Read Successfully!")
print()
print("Aligning Reads...")
align_reads(bwt, len_n, idx, reference, reads, err_thresh)
print("Reads Aligned Successfully!")
print()
print("Cleaning Data...")
cleanup(save_path)
print("Data Cleaned Successfully!")
print()
print("Output saved to processed_reads.csv")
print()
print("Creating Graphs...")
read_distribution(save_path)
coverage(save_path, len(reference))
statistics(save_path)
print("Graphs Created Successfully!")