forked from broadinstitute/ABC-Enhancer-Gene-Prediction
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathjuicebox_dump.py
executable file
·54 lines (45 loc) · 2.51 KB
/
juicebox_dump.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
import argparse
import subprocess
from tools import run_command
def parseargs():
parser = argparse.ArgumentParser(description='Download and dump HiC data')
parser.add_argument('--hic_file', required=True, help="Path or url to .hic file.")
parser.add_argument('--juicebox', required=True, default="", help="path to juicebox executable or java command invoking juicer_tools.jar. eg: 'java -jar juicer_tools.jar'")
parser.add_argument('--resolution', default=5000, help="Resolution of HiC to download. In units of bp.")
parser.add_argument('--outdir', default=".")
parser.add_argument('--include_raw', action="store_true", help="Download raw matrix in addtion to KR")
parser.add_argument('--chromosomes', default="all", help="comma delimited list of chromosomes to download")
parser.add_argument('--skip_gzip', action="store_true", help="dont gzip hic files")
return parser.parse_args()
def main(args):
if args.chromosomes == "all":
chromosomes = list(range(1,23)) + ['X']
else:
chromosomes = args.chromosomes.split(",")
for chromosome in chromosomes:
print("Starting chr" + str(chromosome) + " ... ")
outdir = "{0}/chr{1}/".format(args.outdir, chromosome)
command = "mkdir -p " + outdir
out = subprocess.getoutput(command)
## Download observed matrix with KR normalization
command = args.juicebox + " dump observed KR {0} {1} {1} BP {3} {2}/chr{1}.KRobserved".format(args.hic_file, chromosome, outdir, args.resolution)
print(command)
out = subprocess.getoutput(command)
if not args.skip_gzip:
run_command("gzip {0}/chr{1}.KRobserved".format(outdir, chromosome))
## Download KR norm file
command = args.juicebox + " dump norm KR {0} {1} BP {3} {2}/chr{1}.KRnorm".format(args.hic_file, chromosome, outdir, args.resolution)
out = subprocess.getoutput(command)
print(command)
if not args.skip_gzip:
run_command("gzip {0}/chr{1}.KRnorm".format(outdir, chromosome))
if args.include_raw:
## Download raw observed matrix
command = args.juicebox + " dump observed NONE {0} {1} {1} BP {3} {2}/chr{1}.RAWobserved".format(args.hic_file, chromosome, outdir, args.resolution)
print(command)
out = subprocess.getoutput(command)
if not args.skip_gzip:
run_command("gzip {0}/chr{1}.RAWobserved".format(outdir, chromosome))
if __name__ == '__main__':
args = parseargs()
main(args)